diff --git "a/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" "b/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-w4rlzz90/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.4724, "train/learning_rate": 1.0702900088061256e-07, "train/epoch": 3.0, "train/global_step": 9720, "_runtime": 95217, "_timestamp": 1651769306, "_step": 9739, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 16.0, 47.0, 105.0, 194.0, 255.0, 200.0, 126.0, 40.0, 24.0, 5.0], "bins": [-38.22578811645508, -37.57297134399414, -36.9201545715332, -36.267337799072266, -35.61452102661133, -34.961700439453125, -34.30888366699219, -33.65606689453125, -33.00325012207031, -32.350433349609375, -31.697616577148438, -31.044797897338867, -30.39198112487793, -29.739164352416992, -29.086347579956055, -28.433530807495117, -27.78071403503418, -27.127897262573242, -26.475080490112305, -25.822261810302734, -25.169445037841797, -24.51662826538086, -23.863811492919922, -23.210994720458984, -22.558177947998047, -21.90536117553711, -21.252544403076172, -20.5997257232666, -19.946908950805664, -19.294092178344727, -18.64127540588379, -17.98845863342285, -17.33563804626465, -16.68282127380371, -16.030004501342773, -15.37718677520752, -14.724369049072266, -14.071552276611328, -13.41873550415039, -12.765918731689453, -12.1131010055542, -11.460284233093262, -10.807466506958008, -10.15464973449707, -9.501832962036133, -8.849015235900879, -8.196198463439941, -7.543381214141846, -6.89056396484375, -6.237746715545654, -5.584929466247559, -4.932112693786621, -4.279295444488525, -3.6264781951904297, -2.973661184310913, -2.3208441734313965, -1.6680269241333008, -1.0152097940444946, -0.3623926639556885, 0.2904244661331177, 0.9432415962219238, 1.5960588455200195, 2.248875856399536, 2.9016928672790527, 3.5545101165771484]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 8.0, 10.0, 14.0, 12.0, 17.0, 19.0, 16.0, 30.0, 19.0, 19.0, 31.0, 38.0, 32.0, 37.0, 53.0, 43.0, 41.0, 36.0, 33.0, 34.0, 23.0, 42.0, 37.0, 39.0, 41.0, 31.0, 31.0, 25.0, 25.0, 24.0, 22.0, 15.0, 19.0, 16.0, 4.0, 10.0, 12.0, 5.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76909065246582, -5.58101749420166, -5.3929443359375, -5.204871654510498, -5.016798496246338, -4.828725337982178, -4.640652179718018, -4.452579498291016, -4.2645063400268555, -4.076433181762695, -3.8883602619171143, -3.700287103652954, -3.512214183807373, -3.324141025543213, -3.1360678672790527, -2.9479949474334717, -2.7599217891693115, -2.5718486309051514, -2.3837757110595703, -2.19570255279541, -2.007629632949829, -1.819556474685669, -1.6314834356307983, -1.4434103965759277, -1.2553373575210571, -1.0672643184661865, -0.8791912794113159, -0.6911181807518005, -0.5030451416969299, -0.3149721026420593, -0.12689900398254395, 0.06117403507232666, 0.24924707412719727, 0.43732011318206787, 0.6253931522369385, 0.8134662508964539, 1.0015392303466797, 1.1896123886108398, 1.3776854276657104, 1.565758466720581, 1.7538315057754517, 1.9419045448303223, 2.1299777030944824, 2.3180506229400635, 2.5061237812042236, 2.6941967010498047, 2.882269859313965, 3.070343017578125, 3.258415937423706, 3.446489095687866, 3.6345620155334473, 3.8226351737976074, 4.010708332061768, 4.1987810134887695, 4.38685417175293, 4.57492733001709, 4.76300048828125, 4.95107364654541, 5.13914680480957, 5.327219486236572, 5.515292644500732, 5.703365802764893, 5.891438961029053, 6.079511642456055, 6.267584800720215]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 8.0, 9.0, 17.0, 18.0, 18.0, 31.0, 47.0, 70.0, 99.0, 157.0, 276.0, 414.0, 723.0, 1148.0, 2051.0, 3603.0, 6965.0, 14656.0, 34925.0, 106300.0, 379896.0, 1294548.0, 1630173.0, 498712.0, 140514.0, 43605.0, 17353.0, 8163.0, 4141.0, 2187.0, 1342.0, 825.0, 437.0, 297.0, 172.0, 125.0, 59.0, 62.0, 25.0, 33.0, 19.0, 16.0, 14.0, 8.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.5, -11.141845703125, -10.78369140625, -10.425537109375, -10.0673828125, -9.709228515625, -9.35107421875, -8.992919921875, -8.634765625, -8.276611328125, -7.91845703125, -7.560302734375, -7.2021484375, -6.843994140625, -6.48583984375, -6.127685546875, -5.76953125, -5.411376953125, -5.05322265625, -4.695068359375, -4.3369140625, -3.978759765625, -3.62060546875, -3.262451171875, -2.904296875, -2.546142578125, -2.18798828125, -1.829833984375, -1.4716796875, -1.113525390625, -0.75537109375, -0.397216796875, -0.0390625, 0.319091796875, 0.67724609375, 1.035400390625, 1.3935546875, 1.751708984375, 2.10986328125, 2.468017578125, 2.826171875, 3.184326171875, 3.54248046875, 3.900634765625, 4.2587890625, 4.616943359375, 4.97509765625, 5.333251953125, 5.69140625, 6.049560546875, 6.40771484375, 6.765869140625, 7.1240234375, 7.482177734375, 7.84033203125, 8.198486328125, 8.556640625, 8.914794921875, 9.27294921875, 9.631103515625, 9.9892578125, 10.347412109375, 10.70556640625, 11.063720703125, 11.421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 4.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 23.0, 12.0, 12.0, 32.0, 24.0, 16.0, 18.0, 32.0, 21.0, 33.0, 36.0, 34.0, 43.0, 37.0, 40.0, 36.0, 29.0, 42.0, 41.0, 30.0, 34.0, 30.0, 36.0, 31.0, 20.0, 28.0, 22.0, 28.0, 12.0, 18.0, 17.0, 11.0, 12.0, 13.0, 9.0, 12.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.90625, -8.6258544921875, -8.345458984375, -8.0650634765625, -7.78466796875, -7.5042724609375, -7.223876953125, -6.9434814453125, -6.6630859375, -6.3826904296875, -6.102294921875, -5.8218994140625, -5.54150390625, -5.2611083984375, -4.980712890625, -4.7003173828125, -4.419921875, -4.1395263671875, -3.859130859375, -3.5787353515625, -3.29833984375, -3.0179443359375, -2.737548828125, -2.4571533203125, -2.1767578125, -1.8963623046875, -1.615966796875, -1.3355712890625, -1.05517578125, -0.7747802734375, -0.494384765625, -0.2139892578125, 0.06640625, 0.3468017578125, 0.627197265625, 0.9075927734375, 1.18798828125, 1.4683837890625, 1.748779296875, 2.0291748046875, 2.3095703125, 2.5899658203125, 2.870361328125, 3.1507568359375, 3.43115234375, 3.7115478515625, 3.991943359375, 4.2723388671875, 4.552734375, 4.8331298828125, 5.113525390625, 5.3939208984375, 5.67431640625, 5.9547119140625, 6.235107421875, 6.5155029296875, 6.7958984375, 7.0762939453125, 7.356689453125, 7.6370849609375, 7.91748046875, 8.1978759765625, 8.478271484375, 8.7586669921875, 9.0390625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 18.0, 23.0, 48.0, 42.0, 73.0, 99.0, 137.0, 238.0, 620.0, 18574.0, 4170474.0, 2838.0, 468.0, 214.0, 125.0, 79.0, 69.0, 34.0, 21.0, 14.0, 10.0, 6.0, 8.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-117.5, -113.3515625, -109.203125, -105.0546875, -100.90625, -96.7578125, -92.609375, -88.4609375, -84.3125, -80.1640625, -76.015625, -71.8671875, -67.71875, -63.5703125, -59.421875, -55.2734375, -51.125, -46.9765625, -42.828125, -38.6796875, -34.53125, -30.3828125, -26.234375, -22.0859375, -17.9375, -13.7890625, -9.640625, -5.4921875, -1.34375, 2.8046875, 6.953125, 11.1015625, 15.25, 19.3984375, 23.546875, 27.6953125, 31.84375, 35.9921875, 40.140625, 44.2890625, 48.4375, 52.5859375, 56.734375, 60.8828125, 65.03125, 69.1796875, 73.328125, 77.4765625, 81.625, 85.7734375, 89.921875, 94.0703125, 98.21875, 102.3671875, 106.515625, 110.6640625, 114.8125, 118.9609375, 123.109375, 127.2578125, 131.40625, 135.5546875, 139.703125, 143.8515625, 148.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 19.0, 16.0, 24.0, 36.0, 45.0, 55.0, 84.0, 113.0, 144.0, 234.0, 412.0, 850.0, 769.0, 452.0, 251.0, 163.0, 112.0, 80.0, 45.0, 39.0, 34.0, 21.0, 8.0, 11.0, 2.0, 6.0, 6.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.49609375, -4.341064453125, -4.18603515625, -4.031005859375, -3.8759765625, -3.720947265625, -3.56591796875, -3.410888671875, -3.255859375, -3.100830078125, -2.94580078125, -2.790771484375, -2.6357421875, -2.480712890625, -2.32568359375, -2.170654296875, -2.015625, -1.860595703125, -1.70556640625, -1.550537109375, -1.3955078125, -1.240478515625, -1.08544921875, -0.930419921875, -0.775390625, -0.620361328125, -0.46533203125, -0.310302734375, -0.1552734375, -0.000244140625, 0.15478515625, 0.309814453125, 0.46484375, 0.619873046875, 0.77490234375, 0.929931640625, 1.0849609375, 1.239990234375, 1.39501953125, 1.550048828125, 1.705078125, 1.860107421875, 2.01513671875, 2.170166015625, 2.3251953125, 2.480224609375, 2.63525390625, 2.790283203125, 2.9453125, 3.100341796875, 3.25537109375, 3.410400390625, 3.5654296875, 3.720458984375, 3.87548828125, 4.030517578125, 4.185546875, 4.340576171875, 4.49560546875, 4.650634765625, 4.8056640625, 4.960693359375, 5.11572265625, 5.270751953125, 5.42578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 5.0, 8.0, 7.0, 11.0, 15.0, 19.0, 28.0, 28.0, 27.0, 29.0, 45.0, 48.0, 52.0, 56.0, 53.0, 63.0, 54.0, 62.0, 66.0, 53.0, 46.0, 48.0, 30.0, 35.0, 24.0, 17.0, 16.0, 10.0, 12.0, 5.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.173274040222168, -13.798551559448242, -13.423830032348633, -13.049107551574707, -12.674386024475098, -12.299663543701172, -11.924942016601562, -11.550219535827637, -11.175497055053711, -10.800774574279785, -10.426053047180176, -10.05133056640625, -9.67660903930664, -9.301886558532715, -8.927164077758789, -8.55244255065918, -8.17772102355957, -7.802999019622803, -7.428277015686035, -7.053554534912109, -6.6788330078125, -6.304110527038574, -5.929388523101807, -5.554666519165039, -5.1799445152282715, -4.805222511291504, -4.430500507354736, -4.055778503417969, -3.681056261062622, -3.3063342571258545, -2.931612014770508, -2.5568900108337402, -2.1821680068969727, -1.807446002960205, -1.432723879814148, -1.0580017566680908, -0.6832797527313232, -0.30855774879455566, 0.06616449356079102, 0.4408864974975586, 0.8156085014343262, 1.1903305053710938, 1.5650526285171509, 1.939774751663208, 2.3144967555999756, 2.689218759536743, 3.06394100189209, 3.4386630058288574, 3.813385009765625, 4.188107013702393, 4.56282901763916, 4.937551498413086, 5.312273025512695, 5.686995506286621, 6.061717510223389, 6.436439514160156, 6.811161518096924, 7.185883522033691, 7.560605525970459, 7.935327529907227, 8.310050010681152, 8.684771537780762, 9.059494018554688, 9.434215545654297, 9.808938026428223]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 6.0, 10.0, 16.0, 13.0, 16.0, 18.0, 35.0, 27.0, 28.0, 35.0, 31.0, 35.0, 43.0, 48.0, 45.0, 43.0, 31.0, 52.0, 41.0, 26.0, 42.0, 35.0, 46.0, 31.0, 42.0, 28.0, 33.0, 17.0, 16.0, 15.0, 19.0, 14.0, 8.0, 9.0, 5.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.746149063110352, -9.437788009643555, -9.129427909851074, -8.821066856384277, -8.512706756591797, -8.204345703125, -7.895984649658203, -7.5876240730285645, -7.279263496398926, -6.970902919769287, -6.662542343139648, -6.354181289672852, -6.045820713043213, -5.737460136413574, -5.429099082946777, -5.120738506317139, -4.8123779296875, -4.504017353057861, -4.195656776428223, -3.887295722961426, -3.578935146331787, -3.2705745697021484, -2.9622137546539307, -2.653852939605713, -2.345492362976074, -2.0371317863464355, -1.7287709712982178, -1.4204102754592896, -1.1120495796203613, -0.8036888837814331, -0.4953281879425049, -0.1869673728942871, 0.12139415740966797, 0.4297548532485962, 0.7381155490875244, 1.0464762449264526, 1.3548369407653809, 1.663197636604309, 1.9715583324432373, 2.279919147491455, 2.5882797241210938, 2.8966403007507324, 3.20500111579895, 3.513361930847168, 3.8217225074768066, 4.130083084106445, 4.438444137573242, 4.746804714202881, 5.0551652908325195, 5.363525867462158, 5.671886444091797, 5.980247497558594, 6.288608074188232, 6.596968650817871, 6.905329704284668, 7.213690280914307, 7.522050857543945, 7.830411434173584, 8.138772010803223, 8.44713306427002, 8.7554931640625, 9.063854217529297, 9.372215270996094, 9.68057632446289, 9.988936424255371]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 13.0, 10.0, 17.0, 34.0, 48.0, 69.0, 69.0, 109.0, 173.0, 272.0, 424.0, 607.0, 862.0, 1416.0, 2363.0, 3829.0, 6094.0, 10338.0, 17723.0, 31559.0, 56514.0, 101473.0, 170361.0, 219748.0, 177480.0, 106740.0, 60252.0, 33143.0, 18789.0, 10940.0, 6493.0, 3832.0, 2358.0, 1513.0, 958.0, 587.0, 442.0, 289.0, 194.0, 126.0, 100.0, 49.0, 37.0, 34.0, 18.0, 15.0, 14.0, 4.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.71875, -2.632568359375, -2.54638671875, -2.460205078125, -2.3740234375, -2.287841796875, -2.20166015625, -2.115478515625, -2.029296875, -1.943115234375, -1.85693359375, -1.770751953125, -1.6845703125, -1.598388671875, -1.51220703125, -1.426025390625, -1.33984375, -1.253662109375, -1.16748046875, -1.081298828125, -0.9951171875, -0.908935546875, -0.82275390625, -0.736572265625, -0.650390625, -0.564208984375, -0.47802734375, -0.391845703125, -0.3056640625, -0.219482421875, -0.13330078125, -0.047119140625, 0.0390625, 0.125244140625, 0.21142578125, 0.297607421875, 0.3837890625, 0.469970703125, 0.55615234375, 0.642333984375, 0.728515625, 0.814697265625, 0.90087890625, 0.987060546875, 1.0732421875, 1.159423828125, 1.24560546875, 1.331787109375, 1.41796875, 1.504150390625, 1.59033203125, 1.676513671875, 1.7626953125, 1.848876953125, 1.93505859375, 2.021240234375, 2.107421875, 2.193603515625, 2.27978515625, 2.365966796875, 2.4521484375, 2.538330078125, 2.62451171875, 2.710693359375, 2.796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 5.0, 6.0, 6.0, 9.0, 8.0, 9.0, 15.0, 18.0, 17.0, 24.0, 28.0, 27.0, 33.0, 29.0, 43.0, 38.0, 46.0, 46.0, 40.0, 49.0, 52.0, 34.0, 41.0, 53.0, 38.0, 34.0, 29.0, 34.0, 27.0, 26.0, 26.0, 14.0, 21.0, 22.0, 14.0, 8.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1953125, -7.952880859375, -7.71044921875, -7.468017578125, -7.2255859375, -6.983154296875, -6.74072265625, -6.498291015625, -6.255859375, -6.013427734375, -5.77099609375, -5.528564453125, -5.2861328125, -5.043701171875, -4.80126953125, -4.558837890625, -4.31640625, -4.073974609375, -3.83154296875, -3.589111328125, -3.3466796875, -3.104248046875, -2.86181640625, -2.619384765625, -2.376953125, -2.134521484375, -1.89208984375, -1.649658203125, -1.4072265625, -1.164794921875, -0.92236328125, -0.679931640625, -0.4375, -0.195068359375, 0.04736328125, 0.289794921875, 0.5322265625, 0.774658203125, 1.01708984375, 1.259521484375, 1.501953125, 1.744384765625, 1.98681640625, 2.229248046875, 2.4716796875, 2.714111328125, 2.95654296875, 3.198974609375, 3.44140625, 3.683837890625, 3.92626953125, 4.168701171875, 4.4111328125, 4.653564453125, 4.89599609375, 5.138427734375, 5.380859375, 5.623291015625, 5.86572265625, 6.108154296875, 6.3505859375, 6.593017578125, 6.83544921875, 7.077880859375, 7.3203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 3.0, 3.0, 0.0, 8.0, 6.0, 14.0, 15.0, 17.0, 35.0, 50.0, 62.0, 113.0, 156.0, 259.0, 506.0, 958.0, 2030.0, 5022.0, 13933.0, 46541.0, 185909.0, 478767.0, 230140.0, 56987.0, 16715.0, 5674.0, 2267.0, 1052.0, 530.0, 281.0, 183.0, 103.0, 75.0, 49.0, 22.0, 14.0, 19.0, 8.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.91015625, -4.744140625, -4.578125, -4.412109375, -4.24609375, -4.080078125, -3.9140625, -3.748046875, -3.58203125, -3.416015625, -3.25, -3.083984375, -2.91796875, -2.751953125, -2.5859375, -2.419921875, -2.25390625, -2.087890625, -1.921875, -1.755859375, -1.58984375, -1.423828125, -1.2578125, -1.091796875, -0.92578125, -0.759765625, -0.59375, -0.427734375, -0.26171875, -0.095703125, 0.0703125, 0.236328125, 0.40234375, 0.568359375, 0.734375, 0.900390625, 1.06640625, 1.232421875, 1.3984375, 1.564453125, 1.73046875, 1.896484375, 2.0625, 2.228515625, 2.39453125, 2.560546875, 2.7265625, 2.892578125, 3.05859375, 3.224609375, 3.390625, 3.556640625, 3.72265625, 3.888671875, 4.0546875, 4.220703125, 4.38671875, 4.552734375, 4.71875, 4.884765625, 5.05078125, 5.216796875, 5.3828125, 5.548828125, 5.71484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 10.0, 19.0, 11.0, 26.0, 16.0, 28.0, 19.0, 22.0, 34.0, 28.0, 27.0, 40.0, 59.0, 35.0, 36.0, 39.0, 42.0, 40.0, 51.0, 47.0, 34.0, 36.0, 34.0, 14.0, 23.0, 26.0, 19.0, 14.0, 19.0, 18.0, 14.0, 14.0, 13.0, 9.0, 7.0, 8.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.4140625, -13.9561767578125, -13.498291015625, -13.0404052734375, -12.58251953125, -12.1246337890625, -11.666748046875, -11.2088623046875, -10.7509765625, -10.2930908203125, -9.835205078125, -9.3773193359375, -8.91943359375, -8.4615478515625, -8.003662109375, -7.5457763671875, -7.087890625, -6.6300048828125, -6.172119140625, -5.7142333984375, -5.25634765625, -4.7984619140625, -4.340576171875, -3.8826904296875, -3.4248046875, -2.9669189453125, -2.509033203125, -2.0511474609375, -1.59326171875, -1.1353759765625, -0.677490234375, -0.2196044921875, 0.23828125, 0.6961669921875, 1.154052734375, 1.6119384765625, 2.06982421875, 2.5277099609375, 2.985595703125, 3.4434814453125, 3.9013671875, 4.3592529296875, 4.817138671875, 5.2750244140625, 5.73291015625, 6.1907958984375, 6.648681640625, 7.1065673828125, 7.564453125, 8.0223388671875, 8.480224609375, 8.9381103515625, 9.39599609375, 9.8538818359375, 10.311767578125, 10.7696533203125, 11.2275390625, 11.6854248046875, 12.143310546875, 12.6011962890625, 13.05908203125, 13.5169677734375, 13.974853515625, 14.4327392578125, 14.890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 18.0, 21.0, 34.0, 38.0, 59.0, 102.0, 144.0, 243.0, 362.0, 614.0, 1024.0, 1783.0, 3681.0, 8376.0, 24262.0, 121422.0, 673662.0, 164770.0, 29275.0, 9639.0, 4108.0, 2035.0, 1062.0, 647.0, 396.0, 249.0, 158.0, 97.0, 69.0, 46.0, 37.0, 29.0, 20.0, 20.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.296875, -3.18902587890625, -3.0811767578125, -2.97332763671875, -2.865478515625, -2.75762939453125, -2.6497802734375, -2.54193115234375, -2.43408203125, -2.32623291015625, -2.2183837890625, -2.11053466796875, -2.002685546875, -1.89483642578125, -1.7869873046875, -1.67913818359375, -1.5712890625, -1.46343994140625, -1.3555908203125, -1.24774169921875, -1.139892578125, -1.03204345703125, -0.9241943359375, -0.81634521484375, -0.70849609375, -0.60064697265625, -0.4927978515625, -0.38494873046875, -0.277099609375, -0.16925048828125, -0.0614013671875, 0.04644775390625, 0.154296875, 0.26214599609375, 0.3699951171875, 0.47784423828125, 0.585693359375, 0.69354248046875, 0.8013916015625, 0.90924072265625, 1.01708984375, 1.12493896484375, 1.2327880859375, 1.34063720703125, 1.448486328125, 1.55633544921875, 1.6641845703125, 1.77203369140625, 1.8798828125, 1.98773193359375, 2.0955810546875, 2.20343017578125, 2.311279296875, 2.41912841796875, 2.5269775390625, 2.63482666015625, 2.74267578125, 2.85052490234375, 2.9583740234375, 3.06622314453125, 3.174072265625, 3.28192138671875, 3.3897705078125, 3.49761962890625, 3.60546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 10.0, 19.0, 19.0, 33.0, 55.0, 115.0, 132.0, 160.0, 154.0, 113.0, 59.0, 29.0, 18.0, 17.0, 12.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002132415771484375, -0.002070903778076172, -0.0020093917846679688, -0.0019478797912597656, -0.0018863677978515625, -0.0018248558044433594, -0.0017633438110351562, -0.0017018318176269531, -0.00164031982421875, -0.0015788078308105469, -0.0015172958374023438, -0.0014557838439941406, -0.0013942718505859375, -0.0013327598571777344, -0.0012712478637695312, -0.0012097358703613281, -0.001148223876953125, -0.0010867118835449219, -0.0010251998901367188, -0.0009636878967285156, -0.0009021759033203125, -0.0008406639099121094, -0.0007791519165039062, -0.0007176399230957031, -0.0006561279296875, -0.0005946159362792969, -0.0005331039428710938, -0.0004715919494628906, -0.0004100799560546875, -0.0003485679626464844, -0.00028705596923828125, -0.00022554397583007812, -0.000164031982421875, -0.00010251998901367188, -4.100799560546875e-05, 2.0503997802734375e-05, 8.20159912109375e-05, 0.00014352798461914062, 0.00020503997802734375, 0.0002665519714355469, 0.00032806396484375, 0.0003895759582519531, 0.00045108795166015625, 0.0005125999450683594, 0.0005741119384765625, 0.0006356239318847656, 0.0006971359252929688, 0.0007586479187011719, 0.000820159912109375, 0.0008816719055175781, 0.0009431838989257812, 0.0010046958923339844, 0.0010662078857421875, 0.0011277198791503906, 0.0011892318725585938, 0.0012507438659667969, 0.001312255859375, 0.0013737678527832031, 0.0014352798461914062, 0.0014967918395996094, 0.0015583038330078125, 0.0016198158264160156, 0.0016813278198242188, 0.0017428398132324219, 0.001804351806640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 8.0, 9.0, 11.0, 10.0, 28.0, 49.0, 101.0, 242.0, 579.0, 2079.0, 11848.0, 477005.0, 540771.0, 12604.0, 2155.0, 590.0, 226.0, 91.0, 40.0, 28.0, 19.0, 11.0, 8.0, 6.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8984375, -9.607421875, -9.31640625, -9.025390625, -8.734375, -8.443359375, -8.15234375, -7.861328125, -7.5703125, -7.279296875, -6.98828125, -6.697265625, -6.40625, -6.115234375, -5.82421875, -5.533203125, -5.2421875, -4.951171875, -4.66015625, -4.369140625, -4.078125, -3.787109375, -3.49609375, -3.205078125, -2.9140625, -2.623046875, -2.33203125, -2.041015625, -1.75, -1.458984375, -1.16796875, -0.876953125, -0.5859375, -0.294921875, -0.00390625, 0.287109375, 0.578125, 0.869140625, 1.16015625, 1.451171875, 1.7421875, 2.033203125, 2.32421875, 2.615234375, 2.90625, 3.197265625, 3.48828125, 3.779296875, 4.0703125, 4.361328125, 4.65234375, 4.943359375, 5.234375, 5.525390625, 5.81640625, 6.107421875, 6.3984375, 6.689453125, 6.98046875, 7.271484375, 7.5625, 7.853515625, 8.14453125, 8.435546875, 8.7265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 5.0, 11.0, 5.0, 15.0, 24.0, 27.0, 45.0, 58.0, 87.0, 107.0, 130.0, 126.0, 82.0, 77.0, 54.0, 34.0, 22.0, 19.0, 13.0, 12.0, 12.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.177734375, -1.1428985595703125, -1.108062744140625, -1.0732269287109375, -1.03839111328125, -1.0035552978515625, -0.968719482421875, -0.9338836669921875, -0.8990478515625, -0.8642120361328125, -0.829376220703125, -0.7945404052734375, -0.75970458984375, -0.7248687744140625, -0.690032958984375, -0.6551971435546875, -0.620361328125, -0.5855255126953125, -0.550689697265625, -0.5158538818359375, -0.48101806640625, -0.4461822509765625, -0.411346435546875, -0.3765106201171875, -0.3416748046875, -0.3068389892578125, -0.272003173828125, -0.2371673583984375, -0.20233154296875, -0.1674957275390625, -0.132659912109375, -0.0978240966796875, -0.06298828125, -0.0281524658203125, 0.006683349609375, 0.0415191650390625, 0.07635498046875, 0.1111907958984375, 0.146026611328125, 0.1808624267578125, 0.2156982421875, 0.2505340576171875, 0.285369873046875, 0.3202056884765625, 0.35504150390625, 0.3898773193359375, 0.424713134765625, 0.4595489501953125, 0.494384765625, 0.5292205810546875, 0.564056396484375, 0.5988922119140625, 0.63372802734375, 0.6685638427734375, 0.703399658203125, 0.7382354736328125, 0.7730712890625, 0.8079071044921875, 0.842742919921875, 0.8775787353515625, 0.91241455078125, 0.9472503662109375, 0.982086181640625, 1.0169219970703125, 1.0517578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 10.0, 14.0, 23.0, 33.0, 33.0, 43.0, 60.0, 62.0, 79.0, 80.0, 94.0, 100.0, 72.0, 78.0, 53.0, 52.0, 31.0, 20.0, 12.0, 10.0, 11.0, 11.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.561897277832031, -14.15044116973877, -13.738984107971191, -13.32752799987793, -12.916071891784668, -12.504615783691406, -12.093158721923828, -11.681702613830566, -11.270246505737305, -10.858790397644043, -10.447333335876465, -10.035877227783203, -9.624421119689941, -9.21296501159668, -8.801507949829102, -8.39005184173584, -7.978594779968262, -7.567138195037842, -7.15568208694458, -6.74422550201416, -6.332769393920898, -5.9213128089904785, -5.509856224060059, -5.098400115966797, -4.686943531036377, -4.275486946105957, -3.8640308380126953, -3.4525742530822754, -3.0411179065704346, -2.6296615600585938, -2.218204975128174, -1.806748628616333, -1.3952922821044922, -0.9838358759880066, -0.572379469871521, -0.16092300415039062, 0.2505333423614502, 0.661989688873291, 1.073446273803711, 1.4849026203155518, 1.8963589668273926, 2.3078153133392334, 2.719271659851074, 3.130728244781494, 3.542184591293335, 3.953640937805176, 4.365097522735596, 4.776554107666016, 5.188010215759277, 5.599466800689697, 6.010922908782959, 6.422379493713379, 6.833835601806641, 7.2452921867370605, 7.6567487716674805, 8.068204879760742, 8.47966194152832, 8.891118049621582, 9.30257511138916, 9.714031219482422, 10.125487327575684, 10.536943435668945, 10.948400497436523, 11.359856605529785, 11.771312713623047]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 9.0, 7.0, 8.0, 8.0, 21.0, 13.0, 18.0, 15.0, 17.0, 24.0, 29.0, 38.0, 37.0, 40.0, 42.0, 39.0, 44.0, 44.0, 39.0, 44.0, 31.0, 44.0, 47.0, 27.0, 41.0, 24.0, 28.0, 26.0, 25.0, 30.0, 27.0, 23.0, 14.0, 14.0, 15.0, 9.0, 9.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-8.162459373474121, -7.934866905212402, -7.707274436950684, -7.479681968688965, -7.252089500427246, -7.024497032165527, -6.796904563903809, -6.56931209564209, -6.341719627380371, -6.114127159118652, -5.886534690856934, -5.658942222595215, -5.431349754333496, -5.203757286071777, -4.976164817810059, -4.74857234954834, -4.520979404449463, -4.293386936187744, -4.065794467926025, -3.8382019996643066, -3.610609531402588, -3.383017063140869, -3.1554243564605713, -2.9278318881988525, -2.700239419937134, -2.472646951675415, -2.2450544834136963, -2.0174617767333984, -1.7898694276809692, -1.5622769594192505, -1.3346843719482422, -1.1070919036865234, -0.8794999122619629, -0.6519074440002441, -0.4243149161338806, -0.1967223882675171, 0.03087007999420166, 0.2584625482559204, 0.4860551357269287, 0.7136476039886475, 0.9412400722503662, 1.168832540512085, 1.3964250087738037, 1.624017596244812, 1.8516100645065308, 2.079202651977539, 2.306795120239258, 2.5343875885009766, 2.7619800567626953, 2.989572525024414, 3.217164993286133, 3.4447574615478516, 3.6723499298095703, 3.899942398071289, 4.127534866333008, 4.355127334594727, 4.582719802856445, 4.810312271118164, 5.037904739379883, 5.265497207641602, 5.49308967590332, 5.720682144165039, 5.948274612426758, 6.175867080688477, 6.4034600257873535]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 17.0, 27.0, 32.0, 38.0, 57.0, 96.0, 140.0, 206.0, 341.0, 539.0, 747.0, 1249.0, 2005.0, 3461.0, 5717.0, 10641.0, 19195.0, 37143.0, 72578.0, 144733.0, 239762.0, 230689.0, 135121.0, 67913.0, 34534.0, 17872.0, 9654.0, 5435.0, 3201.0, 1984.0, 1189.0, 746.0, 512.0, 315.0, 206.0, 152.0, 107.0, 51.0, 41.0, 26.0, 20.0, 13.0, 8.0, 3.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.6953125, -3.586456298828125, -3.47760009765625, -3.368743896484375, -3.2598876953125, -3.151031494140625, -3.04217529296875, -2.933319091796875, -2.824462890625, -2.715606689453125, -2.60675048828125, -2.497894287109375, -2.3890380859375, -2.280181884765625, -2.17132568359375, -2.062469482421875, -1.95361328125, -1.844757080078125, -1.73590087890625, -1.627044677734375, -1.5181884765625, -1.409332275390625, -1.30047607421875, -1.191619873046875, -1.082763671875, -0.973907470703125, -0.86505126953125, -0.756195068359375, -0.6473388671875, -0.538482666015625, -0.42962646484375, -0.320770263671875, -0.2119140625, -0.103057861328125, 0.00579833984375, 0.114654541015625, 0.2235107421875, 0.332366943359375, 0.44122314453125, 0.550079345703125, 0.658935546875, 0.767791748046875, 0.87664794921875, 0.985504150390625, 1.0943603515625, 1.203216552734375, 1.31207275390625, 1.420928955078125, 1.52978515625, 1.638641357421875, 1.74749755859375, 1.856353759765625, 1.9652099609375, 2.074066162109375, 2.18292236328125, 2.291778564453125, 2.400634765625, 2.509490966796875, 2.61834716796875, 2.727203369140625, 2.8360595703125, 2.944915771484375, 3.05377197265625, 3.162628173828125, 3.271484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 5.0, 9.0, 10.0, 11.0, 24.0, 17.0, 11.0, 24.0, 28.0, 15.0, 30.0, 38.0, 35.0, 37.0, 31.0, 34.0, 47.0, 44.0, 40.0, 41.0, 39.0, 51.0, 38.0, 30.0, 34.0, 36.0, 36.0, 31.0, 30.0, 26.0, 13.0, 16.0, 18.0, 11.0, 10.0, 7.0, 6.0, 3.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.125, -36.01220703125, -34.8994140625, -33.78662109375, -32.673828125, -31.56103515625, -30.4482421875, -29.33544921875, -28.22265625, -27.10986328125, -25.9970703125, -24.88427734375, -23.771484375, -22.65869140625, -21.5458984375, -20.43310546875, -19.3203125, -18.20751953125, -17.0947265625, -15.98193359375, -14.869140625, -13.75634765625, -12.6435546875, -11.53076171875, -10.41796875, -9.30517578125, -8.1923828125, -7.07958984375, -5.966796875, -4.85400390625, -3.7412109375, -2.62841796875, -1.515625, -0.40283203125, 0.7099609375, 1.82275390625, 2.935546875, 4.04833984375, 5.1611328125, 6.27392578125, 7.38671875, 8.49951171875, 9.6123046875, 10.72509765625, 11.837890625, 12.95068359375, 14.0634765625, 15.17626953125, 16.2890625, 17.40185546875, 18.5146484375, 19.62744140625, 20.740234375, 21.85302734375, 22.9658203125, 24.07861328125, 25.19140625, 26.30419921875, 27.4169921875, 28.52978515625, 29.642578125, 30.75537109375, 31.8681640625, 32.98095703125, 34.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 8.0, 13.0, 16.0, 20.0, 18.0, 27.0, 34.0, 44.0, 62.0, 94.0, 116.0, 156.0, 249.0, 490.0, 1400.0, 13838.0, 576730.0, 442505.0, 10173.0, 1153.0, 477.0, 274.0, 162.0, 111.0, 78.0, 51.0, 52.0, 37.0, 39.0, 34.0, 20.0, 24.0, 10.0, 11.0, 8.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.237060546875, -16.66162109375, -16.086181640625, -15.5107421875, -14.935302734375, -14.35986328125, -13.784423828125, -13.208984375, -12.633544921875, -12.05810546875, -11.482666015625, -10.9072265625, -10.331787109375, -9.75634765625, -9.180908203125, -8.60546875, -8.030029296875, -7.45458984375, -6.879150390625, -6.3037109375, -5.728271484375, -5.15283203125, -4.577392578125, -4.001953125, -3.426513671875, -2.85107421875, -2.275634765625, -1.7001953125, -1.124755859375, -0.54931640625, 0.026123046875, 0.6015625, 1.177001953125, 1.75244140625, 2.327880859375, 2.9033203125, 3.478759765625, 4.05419921875, 4.629638671875, 5.205078125, 5.780517578125, 6.35595703125, 6.931396484375, 7.5068359375, 8.082275390625, 8.65771484375, 9.233154296875, 9.80859375, 10.384033203125, 10.95947265625, 11.534912109375, 12.1103515625, 12.685791015625, 13.26123046875, 13.836669921875, 14.412109375, 14.987548828125, 15.56298828125, 16.138427734375, 16.7138671875, 17.289306640625, 17.86474609375, 18.440185546875, 19.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 4.0, 15.0, 11.0, 17.0, 19.0, 33.0, 30.0, 29.0, 34.0, 40.0, 46.0, 63.0, 51.0, 54.0, 43.0, 66.0, 54.0, 52.0, 48.0, 52.0, 37.0, 27.0, 18.0, 31.0, 17.0, 15.0, 15.0, 19.0, 12.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.48583984375, -35.2529296875, -34.02001953125, -32.787109375, -31.55419921875, -30.3212890625, -29.08837890625, -27.85546875, -26.62255859375, -25.3896484375, -24.15673828125, -22.923828125, -21.69091796875, -20.4580078125, -19.22509765625, -17.9921875, -16.75927734375, -15.5263671875, -14.29345703125, -13.060546875, -11.82763671875, -10.5947265625, -9.36181640625, -8.12890625, -6.89599609375, -5.6630859375, -4.43017578125, -3.197265625, -1.96435546875, -0.7314453125, 0.50146484375, 1.734375, 2.96728515625, 4.2001953125, 5.43310546875, 6.666015625, 7.89892578125, 9.1318359375, 10.36474609375, 11.59765625, 12.83056640625, 14.0634765625, 15.29638671875, 16.529296875, 17.76220703125, 18.9951171875, 20.22802734375, 21.4609375, 22.69384765625, 23.9267578125, 25.15966796875, 26.392578125, 27.62548828125, 28.8583984375, 30.09130859375, 31.32421875, 32.55712890625, 33.7900390625, 35.02294921875, 36.255859375, 37.48876953125, 38.7216796875, 39.95458984375, 41.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 10.0, 11.0, 17.0, 35.0, 25.0, 49.0, 69.0, 92.0, 171.0, 307.0, 527.0, 1070.0, 2483.0, 6270.0, 18610.0, 94102.0, 704972.0, 177806.0, 27536.0, 8239.0, 3047.0, 1352.0, 689.0, 379.0, 236.0, 137.0, 73.0, 57.0, 48.0, 28.0, 21.0, 13.0, 12.0, 9.0, 15.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5478515625, -1.495635986328125, -1.44342041015625, -1.391204833984375, -1.3389892578125, -1.286773681640625, -1.23455810546875, -1.182342529296875, -1.130126953125, -1.077911376953125, -1.02569580078125, -0.973480224609375, -0.9212646484375, -0.869049072265625, -0.81683349609375, -0.764617919921875, -0.71240234375, -0.660186767578125, -0.60797119140625, -0.555755615234375, -0.5035400390625, -0.451324462890625, -0.39910888671875, -0.346893310546875, -0.294677734375, -0.242462158203125, -0.19024658203125, -0.138031005859375, -0.0858154296875, -0.033599853515625, 0.01861572265625, 0.070831298828125, 0.123046875, 0.175262451171875, 0.22747802734375, 0.279693603515625, 0.3319091796875, 0.384124755859375, 0.43634033203125, 0.488555908203125, 0.540771484375, 0.592987060546875, 0.64520263671875, 0.697418212890625, 0.7496337890625, 0.801849365234375, 0.85406494140625, 0.906280517578125, 0.95849609375, 1.010711669921875, 1.06292724609375, 1.115142822265625, 1.1673583984375, 1.219573974609375, 1.27178955078125, 1.324005126953125, 1.376220703125, 1.428436279296875, 1.48065185546875, 1.532867431640625, 1.5850830078125, 1.637298583984375, 1.68951416015625, 1.741729736328125, 1.7939453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 5.0, 5.0, 18.0, 25.0, 20.0, 36.0, 57.0, 73.0, 143.0, 173.0, 133.0, 93.0, 65.0, 43.0, 28.0, 19.0, 11.0, 6.0, 9.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003361701965332031, -0.00032558292150497437, -0.0003149956464767456, -0.00030440837144851685, -0.0002938210964202881, -0.0002832338213920593, -0.00027264654636383057, -0.0002620592713356018, -0.00025147199630737305, -0.0002408847212791443, -0.00023029744625091553, -0.00021971017122268677, -0.000209122896194458, -0.00019853562116622925, -0.0001879483461380005, -0.00017736107110977173, -0.00016677379608154297, -0.0001561865210533142, -0.00014559924602508545, -0.0001350119709968567, -0.00012442469596862793, -0.00011383742094039917, -0.00010325014591217041, -9.266287088394165e-05, -8.207559585571289e-05, -7.148832082748413e-05, -6.090104579925537e-05, -5.031377077102661e-05, -3.972649574279785e-05, -2.9139220714569092e-05, -1.8551945686340332e-05, -7.964670658111572e-06, 2.6226043701171875e-06, 1.3209879398345947e-05, 2.3797154426574707e-05, 3.438442945480347e-05, 4.4971704483032227e-05, 5.5558979511260986e-05, 6.614625453948975e-05, 7.67335295677185e-05, 8.732080459594727e-05, 9.790807962417603e-05, 0.00010849535465240479, 0.00011908262968063354, 0.0001296699047088623, 0.00014025717973709106, 0.00015084445476531982, 0.00016143172979354858, 0.00017201900482177734, 0.0001826062798500061, 0.00019319355487823486, 0.00020378082990646362, 0.00021436810493469238, 0.00022495537996292114, 0.0002355426549911499, 0.00024612993001937866, 0.0002567172050476074, 0.0002673044800758362, 0.00027789175510406494, 0.0002884790301322937, 0.00029906630516052246, 0.0003096535801887512, 0.00032024085521698, 0.00033082813024520874, 0.0003414154052734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 8.0, 9.0, 10.0, 13.0, 19.0, 26.0, 43.0, 47.0, 57.0, 101.0, 148.0, 244.0, 451.0, 771.0, 1349.0, 2649.0, 5686.0, 14124.0, 42669.0, 237272.0, 616950.0, 86488.0, 22718.0, 8582.0, 3778.0, 1916.0, 970.0, 529.0, 345.0, 204.0, 115.0, 86.0, 44.0, 32.0, 18.0, 13.0, 14.0, 14.0, 6.0, 8.0, 7.0, 2.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-1.5556640625, -1.510223388671875, -1.46478271484375, -1.419342041015625, -1.3739013671875, -1.328460693359375, -1.28302001953125, -1.237579345703125, -1.192138671875, -1.146697998046875, -1.10125732421875, -1.055816650390625, -1.0103759765625, -0.964935302734375, -0.91949462890625, -0.874053955078125, -0.82861328125, -0.783172607421875, -0.73773193359375, -0.692291259765625, -0.6468505859375, -0.601409912109375, -0.55596923828125, -0.510528564453125, -0.465087890625, -0.419647216796875, -0.37420654296875, -0.328765869140625, -0.2833251953125, -0.237884521484375, -0.19244384765625, -0.147003173828125, -0.1015625, -0.056121826171875, -0.01068115234375, 0.034759521484375, 0.0802001953125, 0.125640869140625, 0.17108154296875, 0.216522216796875, 0.261962890625, 0.307403564453125, 0.35284423828125, 0.398284912109375, 0.4437255859375, 0.489166259765625, 0.53460693359375, 0.580047607421875, 0.62548828125, 0.670928955078125, 0.71636962890625, 0.761810302734375, 0.8072509765625, 0.852691650390625, 0.89813232421875, 0.943572998046875, 0.989013671875, 1.034454345703125, 1.07989501953125, 1.125335693359375, 1.1707763671875, 1.216217041015625, 1.26165771484375, 1.307098388671875, 1.3525390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 3.0, 8.0, 8.0, 8.0, 14.0, 14.0, 29.0, 45.0, 40.0, 52.0, 66.0, 74.0, 138.0, 120.0, 87.0, 44.0, 45.0, 28.0, 27.0, 33.0, 23.0, 13.0, 11.0, 10.0, 8.0, 7.0, 2.0, 5.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6075897216796875, -0.589691162109375, -0.5717926025390625, -0.55389404296875, -0.5359954833984375, -0.518096923828125, -0.5001983642578125, -0.4822998046875, -0.4644012451171875, -0.446502685546875, -0.4286041259765625, -0.41070556640625, -0.3928070068359375, -0.374908447265625, -0.3570098876953125, -0.339111328125, -0.3212127685546875, -0.303314208984375, -0.2854156494140625, -0.26751708984375, -0.2496185302734375, -0.231719970703125, -0.2138214111328125, -0.1959228515625, -0.1780242919921875, -0.160125732421875, -0.1422271728515625, -0.12432861328125, -0.1064300537109375, -0.088531494140625, -0.0706329345703125, -0.052734375, -0.0348358154296875, -0.016937255859375, 0.0009613037109375, 0.01885986328125, 0.0367584228515625, 0.054656982421875, 0.0725555419921875, 0.0904541015625, 0.1083526611328125, 0.126251220703125, 0.1441497802734375, 0.16204833984375, 0.1799468994140625, 0.197845458984375, 0.2157440185546875, 0.233642578125, 0.2515411376953125, 0.269439697265625, 0.2873382568359375, 0.30523681640625, 0.3231353759765625, 0.341033935546875, 0.3589324951171875, 0.3768310546875, 0.3947296142578125, 0.412628173828125, 0.4305267333984375, 0.44842529296875, 0.4663238525390625, 0.484222412109375, 0.5021209716796875, 0.52001953125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 20.0, 88.0, 236.0, 338.0, 231.0, 80.0, 16.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21491813659668, -11.640115737915039, -9.065313339233398, -6.490509986877441, -3.915707588195801, -1.3409051895141602, 1.2338981628417969, 3.8087005615234375, 6.383502960205078, 8.958305358886719, 11.53310775756836, 14.107911109924316, 16.68271255493164, 19.25751495361328, 21.832319259643555, 24.407121658325195, 26.981924057006836, 29.556726455688477, 32.13153076171875, 34.70633316040039, 37.28113555908203, 39.85593795776367, 42.43074035644531, 45.00554275512695, 47.580345153808594, 50.155147552490234, 52.729949951171875, 55.304752349853516, 57.879554748535156, 60.4543571472168, 63.02915954589844, 65.60396575927734, 68.17876434326172, 70.75357055664062, 73.328369140625, 75.9031753540039, 78.47797393798828, 81.05278015136719, 83.62757873535156, 86.20238494873047, 88.77718353271484, 91.35198974609375, 93.92678833007812, 96.50159454345703, 99.0763931274414, 101.65119934082031, 104.22599792480469, 106.8008041381836, 109.3756103515625, 111.9504165649414, 114.52521514892578, 117.10002136230469, 119.67481994628906, 122.24962615966797, 124.82442474365234, 127.39923095703125, 129.97402954101562, 132.548828125, 135.12364196777344, 137.6984405517578, 140.2732391357422, 142.84803771972656, 145.4228515625, 147.99765014648438, 150.57244873046875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 7.0, 4.0, 11.0, 13.0, 8.0, 10.0, 17.0, 21.0, 17.0, 15.0, 20.0, 14.0, 33.0, 31.0, 28.0, 28.0, 32.0, 34.0, 38.0, 33.0, 40.0, 38.0, 34.0, 38.0, 37.0, 37.0, 41.0, 26.0, 31.0, 31.0, 34.0, 28.0, 23.0, 23.0, 22.0, 17.0, 14.0, 15.0, 12.0, 8.0, 9.0, 7.0, 12.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-54.5134162902832, -52.98008728027344, -51.44675827026367, -49.913429260253906, -48.380104064941406, -46.84677505493164, -45.313446044921875, -43.78011703491211, -42.246788024902344, -40.71345901489258, -39.18013000488281, -37.64680099487305, -36.11347198486328, -34.58014678955078, -33.046817779541016, -31.51348876953125, -29.980159759521484, -28.44683074951172, -26.913501739501953, -25.38017463684082, -23.846845626831055, -22.31351661682129, -20.780189514160156, -19.24686050415039, -17.713531494140625, -16.18020248413086, -14.64687442779541, -13.113546371459961, -11.580217361450195, -10.04688835144043, -8.51356029510498, -6.980232238769531, -5.446903228759766, -3.913574695587158, -2.380246162414551, -0.8469176292419434, 0.6864109039306641, 2.2197394371032715, 3.753067970275879, 5.286396026611328, 6.819725036621094, 8.35305404663086, 9.886382102966309, 11.419710159301758, 12.953039169311523, 14.486368179321289, 16.019695281982422, 17.553024291992188, 19.086353302001953, 20.61968231201172, 22.153011322021484, 23.686338424682617, 25.219667434692383, 26.75299644470215, 28.28632354736328, 29.819652557373047, 31.352981567382812, 32.88631057739258, 34.419639587402344, 35.95296859741211, 37.486297607421875, 39.019622802734375, 40.55295181274414, 42.086280822753906, 43.61960983276367]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 4.0, 11.0, 22.0, 21.0, 21.0, 36.0, 67.0, 101.0, 150.0, 236.0, 422.0, 689.0, 1216.0, 2306.0, 4513.0, 9527.0, 22741.0, 67266.0, 299305.0, 1363011.0, 1838139.0, 440160.0, 93153.0, 28549.0, 11492.0, 5197.0, 2538.0, 1398.0, 778.0, 439.0, 256.0, 169.0, 105.0, 73.0, 39.0, 36.0, 25.0, 17.0, 15.0, 14.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3515625, -10.0189208984375, -9.686279296875, -9.3536376953125, -9.02099609375, -8.6883544921875, -8.355712890625, -8.0230712890625, -7.6904296875, -7.3577880859375, -7.025146484375, -6.6925048828125, -6.35986328125, -6.0272216796875, -5.694580078125, -5.3619384765625, -5.029296875, -4.6966552734375, -4.364013671875, -4.0313720703125, -3.69873046875, -3.3660888671875, -3.033447265625, -2.7008056640625, -2.3681640625, -2.0355224609375, -1.702880859375, -1.3702392578125, -1.03759765625, -0.7049560546875, -0.372314453125, -0.0396728515625, 0.29296875, 0.6256103515625, 0.958251953125, 1.2908935546875, 1.62353515625, 1.9561767578125, 2.288818359375, 2.6214599609375, 2.9541015625, 3.2867431640625, 3.619384765625, 3.9520263671875, 4.28466796875, 4.6173095703125, 4.949951171875, 5.2825927734375, 5.615234375, 5.9478759765625, 6.280517578125, 6.6131591796875, 6.94580078125, 7.2784423828125, 7.611083984375, 7.9437255859375, 8.2763671875, 8.6090087890625, 8.941650390625, 9.2742919921875, 9.60693359375, 9.9395751953125, 10.272216796875, 10.6048583984375, 10.9375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 8.0, 14.0, 18.0, 22.0, 19.0, 19.0, 34.0, 35.0, 28.0, 34.0, 43.0, 39.0, 45.0, 38.0, 42.0, 44.0, 58.0, 33.0, 52.0, 35.0, 47.0, 29.0, 44.0, 27.0, 34.0, 29.0, 14.0, 18.0, 9.0, 8.0, 15.0, 5.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-10.1015625, -9.82958984375, -9.5576171875, -9.28564453125, -9.013671875, -8.74169921875, -8.4697265625, -8.19775390625, -7.92578125, -7.65380859375, -7.3818359375, -7.10986328125, -6.837890625, -6.56591796875, -6.2939453125, -6.02197265625, -5.75, -5.47802734375, -5.2060546875, -4.93408203125, -4.662109375, -4.39013671875, -4.1181640625, -3.84619140625, -3.57421875, -3.30224609375, -3.0302734375, -2.75830078125, -2.486328125, -2.21435546875, -1.9423828125, -1.67041015625, -1.3984375, -1.12646484375, -0.8544921875, -0.58251953125, -0.310546875, -0.03857421875, 0.2333984375, 0.50537109375, 0.77734375, 1.04931640625, 1.3212890625, 1.59326171875, 1.865234375, 2.13720703125, 2.4091796875, 2.68115234375, 2.953125, 3.22509765625, 3.4970703125, 3.76904296875, 4.041015625, 4.31298828125, 4.5849609375, 4.85693359375, 5.12890625, 5.40087890625, 5.6728515625, 5.94482421875, 6.216796875, 6.48876953125, 6.7607421875, 7.03271484375, 7.3046875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 15.0, 16.0, 46.0, 216.0, 3854418.0, 339300.0, 169.0, 46.0, 18.0, 17.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-410.5, -400.23046875, -389.9609375, -379.69140625, -369.421875, -359.15234375, -348.8828125, -338.61328125, -328.34375, -318.07421875, -307.8046875, -297.53515625, -287.265625, -276.99609375, -266.7265625, -256.45703125, -246.1875, -235.91796875, -225.6484375, -215.37890625, -205.109375, -194.83984375, -184.5703125, -174.30078125, -164.03125, -153.76171875, -143.4921875, -133.22265625, -122.953125, -112.68359375, -102.4140625, -92.14453125, -81.875, -71.60546875, -61.3359375, -51.06640625, -40.796875, -30.52734375, -20.2578125, -9.98828125, 0.28125, 10.55078125, 20.8203125, 31.08984375, 41.359375, 51.62890625, 61.8984375, 72.16796875, 82.4375, 92.70703125, 102.9765625, 113.24609375, 123.515625, 133.78515625, 144.0546875, 154.32421875, 164.59375, 174.86328125, 185.1328125, 195.40234375, 205.671875, 215.94140625, 226.2109375, 236.48046875, 246.75]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 22.0, 25.0, 26.0, 40.0, 52.0, 88.0, 136.0, 208.0, 346.0, 572.0, 868.0, 639.0, 376.0, 226.0, 144.0, 104.0, 59.0, 41.0, 16.0, 21.0, 16.0, 11.0, 3.0, 4.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.62213134765625, -4.4708251953125, -4.31951904296875, -4.168212890625, -4.01690673828125, -3.8656005859375, -3.71429443359375, -3.56298828125, -3.41168212890625, -3.2603759765625, -3.10906982421875, -2.957763671875, -2.80645751953125, -2.6551513671875, -2.50384521484375, -2.3525390625, -2.20123291015625, -2.0499267578125, -1.89862060546875, -1.747314453125, -1.59600830078125, -1.4447021484375, -1.29339599609375, -1.14208984375, -0.99078369140625, -0.8394775390625, -0.68817138671875, -0.536865234375, -0.38555908203125, -0.2342529296875, -0.08294677734375, 0.068359375, 0.21966552734375, 0.3709716796875, 0.52227783203125, 0.673583984375, 0.82489013671875, 0.9761962890625, 1.12750244140625, 1.27880859375, 1.43011474609375, 1.5814208984375, 1.73272705078125, 1.884033203125, 2.03533935546875, 2.1866455078125, 2.33795166015625, 2.4892578125, 2.64056396484375, 2.7918701171875, 2.94317626953125, 3.094482421875, 3.24578857421875, 3.3970947265625, 3.54840087890625, 3.69970703125, 3.85101318359375, 4.0023193359375, 4.15362548828125, 4.304931640625, 4.45623779296875, 4.6075439453125, 4.75885009765625, 4.91015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 9.0, 26.0, 33.0, 40.0, 50.0, 78.0, 80.0, 104.0, 114.0, 97.0, 83.0, 61.0, 78.0, 40.0, 31.0, 18.0, 18.0, 13.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.420784950256348, -14.867645263671875, -14.314505577087402, -13.76136589050293, -13.208227157592773, -12.655086517333984, -12.101947784423828, -11.548808097839355, -10.995668411254883, -10.44252872467041, -9.889389038085938, -9.336249351501465, -8.783109664916992, -8.229970932006836, -7.676831245422363, -7.123691558837891, -6.570551872253418, -6.017412185668945, -5.464272499084473, -4.911133289337158, -4.3579936027526855, -3.804853916168213, -3.2517144680023193, -2.698575019836426, -2.145435333251953, -1.59229576587677, -1.039156198501587, -0.4860166311264038, 0.0671229362487793, 0.620262622833252, 1.1734020709991455, 1.726541519165039, 2.279682159423828, 2.832821846008301, 3.3859612941741943, 3.939100742340088, 4.4922404289245605, 5.045380115509033, 5.598519325256348, 6.15165901184082, 6.704798698425293, 7.257938385009766, 7.811078071594238, 8.364217758178711, 8.917356491088867, 9.470497131347656, 10.023635864257812, 10.576775550842285, 11.129915237426758, 11.68305492401123, 12.236194610595703, 12.789334297180176, 13.342473983764648, 13.895612716674805, 14.448752403259277, 15.00189208984375, 15.555031776428223, 16.108171463012695, 16.66131019592285, 17.21445083618164, 17.767589569091797, 18.320730209350586, 18.873868942260742, 19.42700958251953, 19.980148315429688]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 9.0, 7.0, 12.0, 9.0, 16.0, 23.0, 21.0, 33.0, 24.0, 26.0, 29.0, 28.0, 35.0, 40.0, 55.0, 42.0, 46.0, 51.0, 37.0, 47.0, 46.0, 40.0, 36.0, 35.0, 27.0, 23.0, 35.0, 19.0, 25.0, 21.0, 15.0, 18.0, 14.0, 14.0, 13.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.179637908935547, -8.89326286315918, -8.606888771057129, -8.320513725280762, -8.034138679504395, -7.7477641105651855, -7.461389541625977, -7.175014495849609, -6.8886399269104, -6.602265357971191, -6.315890312194824, -6.029515743255615, -5.743141174316406, -5.456766128540039, -5.17039155960083, -4.884016990661621, -4.597641944885254, -4.311267375946045, -4.024892330169678, -3.7385177612304688, -3.4521429538726807, -3.1657681465148926, -2.8793935775756836, -2.5930187702178955, -2.3066439628601074, -2.0202691555023193, -1.7338944673538208, -1.4475197792053223, -1.1611449718475342, -0.8747701644897461, -0.5883954763412476, -0.302020788192749, -0.015646934509277344, 0.27072781324386597, 0.5571025609970093, 0.8434773087501526, 1.129852056503296, 1.416226863861084, 1.7026015520095825, 1.988976240158081, 2.275351047515869, 2.5617258548736572, 2.8481006622314453, 3.1344752311706543, 3.4208500385284424, 3.7072248458862305, 3.9935994148254395, 4.279973983764648, 4.566349029541016, 4.852723598480225, 5.139098644256592, 5.425473213195801, 5.711848258972168, 5.998222827911377, 6.284597396850586, 6.570972442626953, 6.857347011566162, 7.143721580505371, 7.430096626281738, 7.716471195220947, 8.002845764160156, 8.289220809936523, 8.57559585571289, 8.861969947814941, 9.148344993591309]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 5.0, 10.0, 13.0, 25.0, 50.0, 65.0, 126.0, 197.0, 395.0, 635.0, 1182.0, 2291.0, 4624.0, 10327.0, 24724.0, 66349.0, 178856.0, 359565.0, 244010.0, 94274.0, 34591.0, 13863.0, 6096.0, 2908.0, 1533.0, 806.0, 438.0, 248.0, 141.0, 83.0, 51.0, 21.0, 20.0, 15.0, 10.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.21795654296875, -4.0804443359375, -3.94293212890625, -3.805419921875, -3.66790771484375, -3.5303955078125, -3.39288330078125, -3.25537109375, -3.11785888671875, -2.9803466796875, -2.84283447265625, -2.705322265625, -2.56781005859375, -2.4302978515625, -2.29278564453125, -2.1552734375, -2.01776123046875, -1.8802490234375, -1.74273681640625, -1.605224609375, -1.46771240234375, -1.3302001953125, -1.19268798828125, -1.05517578125, -0.91766357421875, -0.7801513671875, -0.64263916015625, -0.505126953125, -0.36761474609375, -0.2301025390625, -0.09259033203125, 0.044921875, 0.18243408203125, 0.3199462890625, 0.45745849609375, 0.594970703125, 0.73248291015625, 0.8699951171875, 1.00750732421875, 1.14501953125, 1.28253173828125, 1.4200439453125, 1.55755615234375, 1.695068359375, 1.83258056640625, 1.9700927734375, 2.10760498046875, 2.2451171875, 2.38262939453125, 2.5201416015625, 2.65765380859375, 2.795166015625, 2.93267822265625, 3.0701904296875, 3.20770263671875, 3.34521484375, 3.48272705078125, 3.6202392578125, 3.75775146484375, 3.895263671875, 4.03277587890625, 4.1702880859375, 4.30780029296875, 4.4453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 4.0, 4.0, 7.0, 10.0, 8.0, 14.0, 16.0, 18.0, 28.0, 17.0, 23.0, 41.0, 31.0, 43.0, 48.0, 47.0, 47.0, 50.0, 41.0, 57.0, 47.0, 55.0, 42.0, 37.0, 29.0, 35.0, 31.0, 32.0, 23.0, 25.0, 16.0, 14.0, 20.0, 9.0, 9.0, 7.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-7.6953125, -7.49102783203125, -7.2867431640625, -7.08245849609375, -6.878173828125, -6.67388916015625, -6.4696044921875, -6.26531982421875, -6.06103515625, -5.85675048828125, -5.6524658203125, -5.44818115234375, -5.243896484375, -5.03961181640625, -4.8353271484375, -4.63104248046875, -4.4267578125, -4.22247314453125, -4.0181884765625, -3.81390380859375, -3.609619140625, -3.40533447265625, -3.2010498046875, -2.99676513671875, -2.79248046875, -2.58819580078125, -2.3839111328125, -2.17962646484375, -1.975341796875, -1.77105712890625, -1.5667724609375, -1.36248779296875, -1.158203125, -0.95391845703125, -0.7496337890625, -0.54534912109375, -0.341064453125, -0.13677978515625, 0.0675048828125, 0.27178955078125, 0.47607421875, 0.68035888671875, 0.8846435546875, 1.08892822265625, 1.293212890625, 1.49749755859375, 1.7017822265625, 1.90606689453125, 2.1103515625, 2.31463623046875, 2.5189208984375, 2.72320556640625, 2.927490234375, 3.13177490234375, 3.3360595703125, 3.54034423828125, 3.74462890625, 3.94891357421875, 4.1531982421875, 4.35748291015625, 4.561767578125, 4.76605224609375, 4.9703369140625, 5.17462158203125, 5.37890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 9.0, 13.0, 14.0, 27.0, 37.0, 67.0, 97.0, 124.0, 209.0, 351.0, 635.0, 1093.0, 2201.0, 4759.0, 11178.0, 28850.0, 84602.0, 265057.0, 411362.0, 155680.0, 49827.0, 18139.0, 7279.0, 3320.0, 1642.0, 767.0, 455.0, 260.0, 159.0, 95.0, 67.0, 38.0, 36.0, 28.0, 17.0, 7.0, 6.0, 8.0, 6.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2265625, -4.09136962890625, -3.9561767578125, -3.82098388671875, -3.685791015625, -3.55059814453125, -3.4154052734375, -3.28021240234375, -3.14501953125, -3.00982666015625, -2.8746337890625, -2.73944091796875, -2.604248046875, -2.46905517578125, -2.3338623046875, -2.19866943359375, -2.0634765625, -1.92828369140625, -1.7930908203125, -1.65789794921875, -1.522705078125, -1.38751220703125, -1.2523193359375, -1.11712646484375, -0.98193359375, -0.84674072265625, -0.7115478515625, -0.57635498046875, -0.441162109375, -0.30596923828125, -0.1707763671875, -0.03558349609375, 0.099609375, 0.23480224609375, 0.3699951171875, 0.50518798828125, 0.640380859375, 0.77557373046875, 0.9107666015625, 1.04595947265625, 1.18115234375, 1.31634521484375, 1.4515380859375, 1.58673095703125, 1.721923828125, 1.85711669921875, 1.9923095703125, 2.12750244140625, 2.2626953125, 2.39788818359375, 2.5330810546875, 2.66827392578125, 2.803466796875, 2.93865966796875, 3.0738525390625, 3.20904541015625, 3.34423828125, 3.47943115234375, 3.6146240234375, 3.74981689453125, 3.885009765625, 4.02020263671875, 4.1553955078125, 4.29058837890625, 4.42578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 2.0, 8.0, 6.0, 5.0, 10.0, 16.0, 21.0, 14.0, 15.0, 24.0, 16.0, 26.0, 34.0, 23.0, 33.0, 43.0, 35.0, 44.0, 37.0, 43.0, 47.0, 35.0, 48.0, 44.0, 47.0, 39.0, 31.0, 36.0, 42.0, 27.0, 12.0, 17.0, 21.0, 12.0, 12.0, 15.0, 8.0, 13.0, 9.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 6.0], "bins": [-12.5546875, -12.21630859375, -11.8779296875, -11.53955078125, -11.201171875, -10.86279296875, -10.5244140625, -10.18603515625, -9.84765625, -9.50927734375, -9.1708984375, -8.83251953125, -8.494140625, -8.15576171875, -7.8173828125, -7.47900390625, -7.140625, -6.80224609375, -6.4638671875, -6.12548828125, -5.787109375, -5.44873046875, -5.1103515625, -4.77197265625, -4.43359375, -4.09521484375, -3.7568359375, -3.41845703125, -3.080078125, -2.74169921875, -2.4033203125, -2.06494140625, -1.7265625, -1.38818359375, -1.0498046875, -0.71142578125, -0.373046875, -0.03466796875, 0.3037109375, 0.64208984375, 0.98046875, 1.31884765625, 1.6572265625, 1.99560546875, 2.333984375, 2.67236328125, 3.0107421875, 3.34912109375, 3.6875, 4.02587890625, 4.3642578125, 4.70263671875, 5.041015625, 5.37939453125, 5.7177734375, 6.05615234375, 6.39453125, 6.73291015625, 7.0712890625, 7.40966796875, 7.748046875, 8.08642578125, 8.4248046875, 8.76318359375, 9.1015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 16.0, 15.0, 28.0, 28.0, 49.0, 50.0, 98.0, 133.0, 286.0, 519.0, 980.0, 1956.0, 4909.0, 13979.0, 49075.0, 243317.0, 552220.0, 134330.0, 30175.0, 9435.0, 3604.0, 1579.0, 737.0, 388.0, 228.0, 123.0, 89.0, 58.0, 43.0, 21.0, 15.0, 11.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.521484375, -2.4434814453125, -2.365478515625, -2.2874755859375, -2.20947265625, -2.1314697265625, -2.053466796875, -1.9754638671875, -1.8974609375, -1.8194580078125, -1.741455078125, -1.6634521484375, -1.58544921875, -1.5074462890625, -1.429443359375, -1.3514404296875, -1.2734375, -1.1954345703125, -1.117431640625, -1.0394287109375, -0.96142578125, -0.8834228515625, -0.805419921875, -0.7274169921875, -0.6494140625, -0.5714111328125, -0.493408203125, -0.4154052734375, -0.33740234375, -0.2593994140625, -0.181396484375, -0.1033935546875, -0.025390625, 0.0526123046875, 0.130615234375, 0.2086181640625, 0.28662109375, 0.3646240234375, 0.442626953125, 0.5206298828125, 0.5986328125, 0.6766357421875, 0.754638671875, 0.8326416015625, 0.91064453125, 0.9886474609375, 1.066650390625, 1.1446533203125, 1.22265625, 1.3006591796875, 1.378662109375, 1.4566650390625, 1.53466796875, 1.6126708984375, 1.690673828125, 1.7686767578125, 1.8466796875, 1.9246826171875, 2.002685546875, 2.0806884765625, 2.15869140625, 2.2366943359375, 2.314697265625, 2.3927001953125, 2.470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 15.0, 8.0, 17.0, 13.0, 25.0, 31.0, 26.0, 42.0, 54.0, 71.0, 75.0, 99.0, 76.0, 92.0, 68.0, 51.0, 46.0, 38.0, 39.0, 14.0, 14.0, 15.0, 11.0, 14.0, 12.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0011110305786132812, -0.0010795444250106812, -0.001048058271408081, -0.001016572117805481, -0.0009850859642028809, -0.0009535998106002808, -0.0009221136569976807, -0.0008906275033950806, -0.0008591413497924805, -0.0008276551961898804, -0.0007961690425872803, -0.0007646828889846802, -0.0007331967353820801, -0.00070171058177948, -0.0006702244281768799, -0.0006387382745742798, -0.0006072521209716797, -0.0005757659673690796, -0.0005442798137664795, -0.0005127936601638794, -0.0004813075065612793, -0.0004498213529586792, -0.0004183351993560791, -0.000386849045753479, -0.0003553628921508789, -0.0003238767385482788, -0.0002923905849456787, -0.0002609044313430786, -0.00022941827774047852, -0.00019793212413787842, -0.00016644597053527832, -0.00013495981693267822, -0.00010347366333007812, -7.198750972747803e-05, -4.050135612487793e-05, -9.015202522277832e-06, 2.2470951080322266e-05, 5.395710468292236e-05, 8.544325828552246e-05, 0.00011692941188812256, 0.00014841556549072266, 0.00017990171909332275, 0.00021138787269592285, 0.00024287402629852295, 0.00027436017990112305, 0.00030584633350372314, 0.00033733248710632324, 0.00036881864070892334, 0.00040030479431152344, 0.00043179094791412354, 0.00046327710151672363, 0.0004947632551193237, 0.0005262494087219238, 0.0005577355623245239, 0.000589221715927124, 0.0006207078695297241, 0.0006521940231323242, 0.0006836801767349243, 0.0007151663303375244, 0.0007466524839401245, 0.0007781386375427246, 0.0008096247911453247, 0.0008411109447479248, 0.0008725970983505249, 0.000904083251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 3.0, 11.0, 20.0, 8.0, 20.0, 24.0, 28.0, 38.0, 74.0, 135.0, 383.0, 1536.0, 11829.0, 276534.0, 723367.0, 30615.0, 2799.0, 630.0, 204.0, 89.0, 53.0, 35.0, 24.0, 14.0, 14.0, 13.0, 10.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.049560546875, -4.87646484375, -4.703369140625, -4.5302734375, -4.357177734375, -4.18408203125, -4.010986328125, -3.837890625, -3.664794921875, -3.49169921875, -3.318603515625, -3.1455078125, -2.972412109375, -2.79931640625, -2.626220703125, -2.453125, -2.280029296875, -2.10693359375, -1.933837890625, -1.7607421875, -1.587646484375, -1.41455078125, -1.241455078125, -1.068359375, -0.895263671875, -0.72216796875, -0.549072265625, -0.3759765625, -0.202880859375, -0.02978515625, 0.143310546875, 0.31640625, 0.489501953125, 0.66259765625, 0.835693359375, 1.0087890625, 1.181884765625, 1.35498046875, 1.528076171875, 1.701171875, 1.874267578125, 2.04736328125, 2.220458984375, 2.3935546875, 2.566650390625, 2.73974609375, 2.912841796875, 3.0859375, 3.259033203125, 3.43212890625, 3.605224609375, 3.7783203125, 3.951416015625, 4.12451171875, 4.297607421875, 4.470703125, 4.643798828125, 4.81689453125, 4.989990234375, 5.1630859375, 5.336181640625, 5.50927734375, 5.682373046875, 5.85546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 12.0, 14.0, 16.0, 17.0, 33.0, 42.0, 53.0, 77.0, 101.0, 102.0, 89.0, 105.0, 70.0, 71.0, 54.0, 34.0, 29.0, 23.0, 18.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90966796875, -0.8845901489257812, -0.8595123291015625, -0.8344345092773438, -0.809356689453125, -0.7842788696289062, -0.7592010498046875, -0.7341232299804688, -0.70904541015625, -0.6839675903320312, -0.6588897705078125, -0.6338119506835938, -0.608734130859375, -0.5836563110351562, -0.5585784912109375, -0.5335006713867188, -0.5084228515625, -0.48334503173828125, -0.4582672119140625, -0.43318939208984375, -0.408111572265625, -0.38303375244140625, -0.3579559326171875, -0.33287811279296875, -0.30780029296875, -0.28272247314453125, -0.2576446533203125, -0.23256683349609375, -0.207489013671875, -0.18241119384765625, -0.1573333740234375, -0.13225555419921875, -0.107177734375, -0.08209991455078125, -0.0570220947265625, -0.03194427490234375, -0.006866455078125, 0.01821136474609375, 0.0432891845703125, 0.06836700439453125, 0.09344482421875, 0.11852264404296875, 0.1436004638671875, 0.16867828369140625, 0.193756103515625, 0.21883392333984375, 0.2439117431640625, 0.26898956298828125, 0.2940673828125, 0.31914520263671875, 0.3442230224609375, 0.36930084228515625, 0.394378662109375, 0.41945648193359375, 0.4445343017578125, 0.46961212158203125, 0.49468994140625, 0.5197677612304688, 0.5448455810546875, 0.5699234008789062, 0.595001220703125, 0.6200790405273438, 0.6451568603515625, 0.6702346801757812, 0.6953125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 21.0, 20.0, 37.0, 52.0, 62.0, 86.0, 106.0, 132.0, 116.0, 108.0, 77.0, 53.0, 45.0, 23.0, 15.0, 12.0, 8.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.724215507507324, -11.343389511108398, -10.962564468383789, -10.58173942565918, -10.200913429260254, -9.820087432861328, -9.439262390136719, -9.05843734741211, -8.677611351013184, -8.296785354614258, -7.915960311889648, -7.535134792327881, -7.154309272766113, -6.773483753204346, -6.392658233642578, -6.0118327140808105, -5.631007194519043, -5.250181674957275, -4.869356155395508, -4.48853063583374, -4.107705116271973, -3.726879596710205, -3.3460540771484375, -2.96522855758667, -2.5844030380249023, -2.2035775184631348, -1.8227519989013672, -1.4419264793395996, -1.061100959777832, -0.6802754402160645, -0.2994499206542969, 0.0813755989074707, 0.4622011184692383, 0.8430266380310059, 1.2238521575927734, 1.604677677154541, 1.9855031967163086, 2.366328716278076, 2.7471542358398438, 3.1279797554016113, 3.508805274963379, 3.8896307945251465, 4.270456314086914, 4.651281833648682, 5.032107353210449, 5.412932872772217, 5.793758392333984, 6.174583911895752, 6.5554094314575195, 6.936234951019287, 7.317060470581055, 7.697885990142822, 8.07871150970459, 8.459537506103516, 8.840362548828125, 9.221187591552734, 9.60201358795166, 9.982839584350586, 10.363664627075195, 10.744489669799805, 11.12531566619873, 11.506141662597656, 11.886966705322266, 12.267791748046875, 12.6486177444458]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 11.0, 16.0, 22.0, 25.0, 27.0, 32.0, 21.0, 42.0, 50.0, 38.0, 57.0, 47.0, 43.0, 46.0, 48.0, 54.0, 48.0, 31.0, 43.0, 43.0, 30.0, 20.0, 25.0, 22.0, 26.0, 16.0, 26.0, 20.0, 9.0, 5.0, 7.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.660863399505615, -6.4587483406066895, -6.2566328048706055, -6.05451774597168, -5.852402687072754, -5.650287628173828, -5.448172569274902, -5.246057033538818, -5.043941974639893, -4.841826915740967, -4.639711380004883, -4.437596321105957, -4.235481262207031, -4.0333662033081055, -3.8312509059906006, -3.6291356086730957, -3.42702054977417, -3.224905490875244, -3.0227901935577393, -2.8206748962402344, -2.6185598373413086, -2.416444778442383, -2.214329481124878, -2.012214183807373, -1.8100991249084473, -1.607983946800232, -1.4058687686920166, -1.2037535905838013, -1.001638412475586, -0.7995232343673706, -0.5974080562591553, -0.39529287815093994, -0.1931777000427246, 0.008937478065490723, 0.21105265617370605, 0.4131678342819214, 0.6152830123901367, 0.817398190498352, 1.0195133686065674, 1.2216285467147827, 1.423743724822998, 1.6258589029312134, 1.8279740810394287, 2.0300893783569336, 2.2322044372558594, 2.434319496154785, 2.63643479347229, 2.838550090789795, 3.0406651496887207, 3.2427802085876465, 3.4448955059051514, 3.6470108032226562, 3.849125862121582, 4.051240921020508, 4.253355979919434, 4.455471515655518, 4.657586574554443, 4.859701633453369, 5.061817169189453, 5.263932228088379, 5.466047286987305, 5.6681623458862305, 5.870277404785156, 6.07239294052124, 6.274507999420166]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 6.0, 8.0, 28.0, 39.0, 68.0, 148.0, 288.0, 552.0, 1060.0, 2181.0, 4716.0, 10863.0, 27660.0, 80539.0, 304231.0, 433970.0, 117962.0, 38281.0, 14468.0, 6153.0, 2650.0, 1327.0, 653.0, 306.0, 165.0, 96.0, 51.0, 32.0, 18.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.109375, -5.92510986328125, -5.7408447265625, -5.55657958984375, -5.372314453125, -5.18804931640625, -5.0037841796875, -4.81951904296875, -4.63525390625, -4.45098876953125, -4.2667236328125, -4.08245849609375, -3.898193359375, -3.71392822265625, -3.5296630859375, -3.34539794921875, -3.1611328125, -2.97686767578125, -2.7926025390625, -2.60833740234375, -2.424072265625, -2.23980712890625, -2.0555419921875, -1.87127685546875, -1.68701171875, -1.50274658203125, -1.3184814453125, -1.13421630859375, -0.949951171875, -0.76568603515625, -0.5814208984375, -0.39715576171875, -0.212890625, -0.02862548828125, 0.1556396484375, 0.33990478515625, 0.524169921875, 0.70843505859375, 0.8927001953125, 1.07696533203125, 1.26123046875, 1.44549560546875, 1.6297607421875, 1.81402587890625, 1.998291015625, 2.18255615234375, 2.3668212890625, 2.55108642578125, 2.7353515625, 2.91961669921875, 3.1038818359375, 3.28814697265625, 3.472412109375, 3.65667724609375, 3.8409423828125, 4.02520751953125, 4.20947265625, 4.39373779296875, 4.5780029296875, 4.76226806640625, 4.946533203125, 5.13079833984375, 5.3150634765625, 5.49932861328125, 5.68359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 11.0, 3.0, 10.0, 8.0, 6.0, 18.0, 18.0, 14.0, 19.0, 20.0, 23.0, 33.0, 27.0, 43.0, 27.0, 39.0, 49.0, 38.0, 47.0, 48.0, 57.0, 46.0, 50.0, 41.0, 38.0, 29.0, 28.0, 34.0, 29.0, 14.0, 28.0, 27.0, 22.0, 12.0, 11.0, 6.0, 4.0, 7.0, 3.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-21.515625, -20.946044921875, -20.37646484375, -19.806884765625, -19.2373046875, -18.667724609375, -18.09814453125, -17.528564453125, -16.958984375, -16.389404296875, -15.81982421875, -15.250244140625, -14.6806640625, -14.111083984375, -13.54150390625, -12.971923828125, -12.40234375, -11.832763671875, -11.26318359375, -10.693603515625, -10.1240234375, -9.554443359375, -8.98486328125, -8.415283203125, -7.845703125, -7.276123046875, -6.70654296875, -6.136962890625, -5.5673828125, -4.997802734375, -4.42822265625, -3.858642578125, -3.2890625, -2.719482421875, -2.14990234375, -1.580322265625, -1.0107421875, -0.441162109375, 0.12841796875, 0.697998046875, 1.267578125, 1.837158203125, 2.40673828125, 2.976318359375, 3.5458984375, 4.115478515625, 4.68505859375, 5.254638671875, 5.82421875, 6.393798828125, 6.96337890625, 7.532958984375, 8.1025390625, 8.672119140625, 9.24169921875, 9.811279296875, 10.380859375, 10.950439453125, 11.52001953125, 12.089599609375, 12.6591796875, 13.228759765625, 13.79833984375, 14.367919921875, 14.9375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 7.0, 5.0, 11.0, 9.0, 16.0, 26.0, 26.0, 24.0, 29.0, 23.0, 39.0, 61.0, 80.0, 98.0, 149.0, 585.0, 1031426.0, 15200.0, 251.0, 118.0, 73.0, 62.0, 42.0, 33.0, 24.0, 26.0, 23.0, 18.0, 8.0, 9.0, 6.0, 8.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.4375, -65.24609375, -63.0546875, -60.86328125, -58.671875, -56.48046875, -54.2890625, -52.09765625, -49.90625, -47.71484375, -45.5234375, -43.33203125, -41.140625, -38.94921875, -36.7578125, -34.56640625, -32.375, -30.18359375, -27.9921875, -25.80078125, -23.609375, -21.41796875, -19.2265625, -17.03515625, -14.84375, -12.65234375, -10.4609375, -8.26953125, -6.078125, -3.88671875, -1.6953125, 0.49609375, 2.6875, 4.87890625, 7.0703125, 9.26171875, 11.453125, 13.64453125, 15.8359375, 18.02734375, 20.21875, 22.41015625, 24.6015625, 26.79296875, 28.984375, 31.17578125, 33.3671875, 35.55859375, 37.75, 39.94140625, 42.1328125, 44.32421875, 46.515625, 48.70703125, 50.8984375, 53.08984375, 55.28125, 57.47265625, 59.6640625, 61.85546875, 64.046875, 66.23828125, 68.4296875, 70.62109375, 72.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 4.0, 5.0, 8.0, 2.0, 13.0, 7.0, 21.0, 23.0, 23.0, 27.0, 26.0, 28.0, 30.0, 53.0, 59.0, 61.0, 55.0, 52.0, 60.0, 41.0, 56.0, 38.0, 50.0, 40.0, 32.0, 28.0, 29.0, 26.0, 22.0, 20.0, 8.0, 8.0, 6.0, 7.0, 9.0, 8.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.390625, -21.66552734375, -20.9404296875, -20.21533203125, -19.490234375, -18.76513671875, -18.0400390625, -17.31494140625, -16.58984375, -15.86474609375, -15.1396484375, -14.41455078125, -13.689453125, -12.96435546875, -12.2392578125, -11.51416015625, -10.7890625, -10.06396484375, -9.3388671875, -8.61376953125, -7.888671875, -7.16357421875, -6.4384765625, -5.71337890625, -4.98828125, -4.26318359375, -3.5380859375, -2.81298828125, -2.087890625, -1.36279296875, -0.6376953125, 0.08740234375, 0.8125, 1.53759765625, 2.2626953125, 2.98779296875, 3.712890625, 4.43798828125, 5.1630859375, 5.88818359375, 6.61328125, 7.33837890625, 8.0634765625, 8.78857421875, 9.513671875, 10.23876953125, 10.9638671875, 11.68896484375, 12.4140625, 13.13916015625, 13.8642578125, 14.58935546875, 15.314453125, 16.03955078125, 16.7646484375, 17.48974609375, 18.21484375, 18.93994140625, 19.6650390625, 20.39013671875, 21.115234375, 21.84033203125, 22.5654296875, 23.29052734375, 24.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 3.0, 8.0, 7.0, 12.0, 15.0, 27.0, 33.0, 82.0, 173.0, 533.0, 1941.0, 13494.0, 827447.0, 194927.0, 7766.0, 1332.0, 399.0, 152.0, 71.0, 29.0, 18.0, 14.0, 15.0, 8.0, 14.0, 8.0, 1.0, 6.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.88671875, -7.6468505859375, -7.406982421875, -7.1671142578125, -6.92724609375, -6.6873779296875, -6.447509765625, -6.2076416015625, -5.9677734375, -5.7279052734375, -5.488037109375, -5.2481689453125, -5.00830078125, -4.7684326171875, -4.528564453125, -4.2886962890625, -4.048828125, -3.8089599609375, -3.569091796875, -3.3292236328125, -3.08935546875, -2.8494873046875, -2.609619140625, -2.3697509765625, -2.1298828125, -1.8900146484375, -1.650146484375, -1.4102783203125, -1.17041015625, -0.9305419921875, -0.690673828125, -0.4508056640625, -0.2109375, 0.0289306640625, 0.268798828125, 0.5086669921875, 0.74853515625, 0.9884033203125, 1.228271484375, 1.4681396484375, 1.7080078125, 1.9478759765625, 2.187744140625, 2.4276123046875, 2.66748046875, 2.9073486328125, 3.147216796875, 3.3870849609375, 3.626953125, 3.8668212890625, 4.106689453125, 4.3465576171875, 4.58642578125, 4.8262939453125, 5.066162109375, 5.3060302734375, 5.5458984375, 5.7857666015625, 6.025634765625, 6.2655029296875, 6.50537109375, 6.7452392578125, 6.985107421875, 7.2249755859375, 7.46484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 4.0, 8.0, 11.0, 22.0, 36.0, 60.0, 96.0, 241.0, 219.0, 118.0, 57.0, 40.0, 24.0, 15.0, 14.0, 6.0, 3.0, 11.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000522613525390625, -0.0005025789141654968, -0.00048254430294036865, -0.0004625096917152405, -0.0004424750804901123, -0.00042244046926498413, -0.00040240585803985596, -0.0003823712468147278, -0.0003623366355895996, -0.00034230202436447144, -0.00032226741313934326, -0.0003022328019142151, -0.0002821981906890869, -0.00026216357946395874, -0.00024212896823883057, -0.0002220943570137024, -0.00020205974578857422, -0.00018202513456344604, -0.00016199052333831787, -0.0001419559121131897, -0.00012192130088806152, -0.00010188668966293335, -8.185207843780518e-05, -6.1817467212677e-05, -4.178285598754883e-05, -2.1748244762420654e-05, -1.7136335372924805e-06, 1.8320977687835693e-05, 3.835558891296387e-05, 5.839020013809204e-05, 7.842481136322021e-05, 9.845942258834839e-05, 0.00011849403381347656, 0.00013852864503860474, 0.0001585632562637329, 0.00017859786748886108, 0.00019863247871398926, 0.00021866708993911743, 0.0002387017011642456, 0.0002587363123893738, 0.00027877092361450195, 0.0002988055348396301, 0.0003188401460647583, 0.0003388747572898865, 0.00035890936851501465, 0.0003789439797401428, 0.000398978590965271, 0.00041901320219039917, 0.00043904781341552734, 0.0004590824246406555, 0.0004791170358657837, 0.0004991516470909119, 0.00051918625831604, 0.0005392208695411682, 0.0005592554807662964, 0.0005792900919914246, 0.0005993247032165527, 0.0006193593144416809, 0.0006393939256668091, 0.0006594285368919373, 0.0006794631481170654, 0.0006994977593421936, 0.0007195323705673218, 0.00073956698179245, 0.0007596015930175781]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 3.0, 11.0, 18.0, 27.0, 42.0, 77.0, 133.0, 378.0, 1425.0, 6823.0, 85709.0, 920048.0, 28552.0, 3791.0, 943.0, 249.0, 131.0, 67.0, 35.0, 21.0, 19.0, 13.0, 5.0, 4.0, 2.0, 2.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.73828125, -7.5252685546875, -7.312255859375, -7.0992431640625, -6.88623046875, -6.6732177734375, -6.460205078125, -6.2471923828125, -6.0341796875, -5.8211669921875, -5.608154296875, -5.3951416015625, -5.18212890625, -4.9691162109375, -4.756103515625, -4.5430908203125, -4.330078125, -4.1170654296875, -3.904052734375, -3.6910400390625, -3.47802734375, -3.2650146484375, -3.052001953125, -2.8389892578125, -2.6259765625, -2.4129638671875, -2.199951171875, -1.9869384765625, -1.77392578125, -1.5609130859375, -1.347900390625, -1.1348876953125, -0.921875, -0.7088623046875, -0.495849609375, -0.2828369140625, -0.06982421875, 0.1431884765625, 0.356201171875, 0.5692138671875, 0.7822265625, 0.9952392578125, 1.208251953125, 1.4212646484375, 1.63427734375, 1.8472900390625, 2.060302734375, 2.2733154296875, 2.486328125, 2.6993408203125, 2.912353515625, 3.1253662109375, 3.33837890625, 3.5513916015625, 3.764404296875, 3.9774169921875, 4.1904296875, 4.4034423828125, 4.616455078125, 4.8294677734375, 5.04248046875, 5.2554931640625, 5.468505859375, 5.6815185546875, 5.89453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 7.0, 3.0, 16.0, 19.0, 23.0, 35.0, 51.0, 97.0, 211.0, 253.0, 87.0, 55.0, 39.0, 27.0, 18.0, 9.0, 15.0, 4.0, 2.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0134429931640625, -0.965362548828125, -0.9172821044921875, -0.86920166015625, -0.8211212158203125, -0.773040771484375, -0.7249603271484375, -0.6768798828125, -0.6287994384765625, -0.580718994140625, -0.5326385498046875, -0.48455810546875, -0.4364776611328125, -0.388397216796875, -0.3403167724609375, -0.292236328125, -0.2441558837890625, -0.196075439453125, -0.1479949951171875, -0.09991455078125, -0.0518341064453125, -0.003753662109375, 0.0443267822265625, 0.0924072265625, 0.1404876708984375, 0.188568115234375, 0.2366485595703125, 0.28472900390625, 0.3328094482421875, 0.380889892578125, 0.4289703369140625, 0.47705078125, 0.5251312255859375, 0.573211669921875, 0.6212921142578125, 0.66937255859375, 0.7174530029296875, 0.765533447265625, 0.8136138916015625, 0.8616943359375, 0.9097747802734375, 0.957855224609375, 1.0059356689453125, 1.05401611328125, 1.1020965576171875, 1.150177001953125, 1.1982574462890625, 1.246337890625, 1.2944183349609375, 1.342498779296875, 1.3905792236328125, 1.43865966796875, 1.4867401123046875, 1.534820556640625, 1.5829010009765625, 1.6309814453125, 1.6790618896484375, 1.727142333984375, 1.7752227783203125, 1.82330322265625, 1.8713836669921875, 1.919464111328125, 1.9675445556640625, 2.015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 19.0, 43.0, 90.0, 148.0, 220.0, 224.0, 133.0, 71.0, 30.0, 16.0, 6.0, 9.0, 1.0, 2.0, 0.0, 2.0], "bins": [-75.38662719726562, -73.96429443359375, -72.54196166992188, -71.11962890625, -69.69729614257812, -68.27496337890625, -66.85263061523438, -65.43029022216797, -64.0079574584961, -62.58562469482422, -61.163291931152344, -59.74095916748047, -58.31862258911133, -56.89628982543945, -55.47395706176758, -54.0516242980957, -52.62929153442383, -51.20695877075195, -49.78462600708008, -48.36228942871094, -46.93995666503906, -45.51762390136719, -44.09529113769531, -42.67295837402344, -41.25062561035156, -39.82829284667969, -38.40596008300781, -36.98362731933594, -35.5612907409668, -34.13895797729492, -32.71662521362305, -31.294292449951172, -29.871959686279297, -28.449626922607422, -27.027292251586914, -25.60495948791504, -24.18262481689453, -22.760292053222656, -21.33795928955078, -19.915626525878906, -18.4932918548584, -17.070959091186523, -15.648624420166016, -14.22629165649414, -12.80395793914795, -11.381624221801758, -9.959291458129883, -8.536957740783691, -7.1146240234375, -5.692290306091309, -4.269957065582275, -2.847623825073242, -1.4252901077270508, -0.002956390380859375, 1.4193763732910156, 2.841710090637207, 4.264043807983398, 5.68637752532959, 7.108710765838623, 8.531044006347656, 9.953377723693848, 11.375711441040039, 12.798044204711914, 14.220377922058105, 15.642711639404297]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 3.0, 7.0, 11.0, 6.0, 11.0, 15.0, 14.0, 16.0, 17.0, 27.0, 24.0, 29.0, 25.0, 34.0, 27.0, 36.0, 33.0, 44.0, 38.0, 40.0, 31.0, 43.0, 31.0, 42.0, 35.0, 35.0, 35.0, 35.0, 29.0, 25.0, 25.0, 23.0, 17.0, 23.0, 17.0, 12.0, 9.0, 10.0, 12.0, 8.0, 9.0, 9.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.943883895874023, -20.214523315429688, -19.485164642333984, -18.75580406188965, -18.026443481445312, -17.29708480834961, -16.567724227905273, -15.838364601135254, -15.109004974365234, -14.379645347595215, -13.650285720825195, -12.92092514038086, -12.19156551361084, -11.46220588684082, -10.732845306396484, -10.003485679626465, -9.274126052856445, -8.544766426086426, -7.815406322479248, -7.08604621887207, -6.356686592102051, -5.627326965332031, -4.8979668617248535, -4.168606758117676, -3.4392471313476562, -2.7098872661590576, -1.980527400970459, -1.2511675357818604, -0.5218076705932617, 0.20755219459533691, 0.9369120597839355, 1.6662721633911133, 2.3956336975097656, 3.1249935626983643, 3.854353427886963, 4.583713531494141, 5.31307315826416, 6.04243278503418, 6.771792888641357, 7.501152992248535, 8.230512619018555, 8.959872245788574, 9.689231872558594, 10.41859245300293, 11.14795207977295, 11.877311706542969, 12.606672286987305, 13.336031913757324, 14.065391540527344, 14.794751167297363, 15.524110794067383, 16.25347137451172, 16.982830047607422, 17.712190628051758, 18.441551208496094, 19.170909881591797, 19.900270462036133, 20.62963104248047, 21.358989715576172, 22.088350296020508, 22.817710876464844, 23.547069549560547, 24.276430130004883, 25.00579071044922, 25.735149383544922]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 9.0, 6.0, 3.0, 8.0, 10.0, 11.0, 24.0, 21.0, 14.0, 38.0, 27.0, 45.0, 54.0, 71.0, 140.0, 231.0, 420.0, 848.0, 1801.0, 4504.0, 13468.0, 58380.0, 604054.0, 2936426.0, 502589.0, 51062.0, 12123.0, 4202.0, 1735.0, 821.0, 448.0, 211.0, 142.0, 85.0, 66.0, 34.0, 35.0, 26.0, 11.0, 16.0, 12.0, 13.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0], "bins": [-16.484375, -16.006103515625, -15.52783203125, -15.049560546875, -14.5712890625, -14.093017578125, -13.61474609375, -13.136474609375, -12.658203125, -12.179931640625, -11.70166015625, -11.223388671875, -10.7451171875, -10.266845703125, -9.78857421875, -9.310302734375, -8.83203125, -8.353759765625, -7.87548828125, -7.397216796875, -6.9189453125, -6.440673828125, -5.96240234375, -5.484130859375, -5.005859375, -4.527587890625, -4.04931640625, -3.571044921875, -3.0927734375, -2.614501953125, -2.13623046875, -1.657958984375, -1.1796875, -0.701416015625, -0.22314453125, 0.255126953125, 0.7333984375, 1.211669921875, 1.68994140625, 2.168212890625, 2.646484375, 3.124755859375, 3.60302734375, 4.081298828125, 4.5595703125, 5.037841796875, 5.51611328125, 5.994384765625, 6.47265625, 6.950927734375, 7.42919921875, 7.907470703125, 8.3857421875, 8.864013671875, 9.34228515625, 9.820556640625, 10.298828125, 10.777099609375, 11.25537109375, 11.733642578125, 12.2119140625, 12.690185546875, 13.16845703125, 13.646728515625, 14.125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 10.0, 6.0, 10.0, 11.0, 17.0, 23.0, 30.0, 28.0, 23.0, 35.0, 48.0, 57.0, 48.0, 57.0, 51.0, 51.0, 55.0, 58.0, 49.0, 35.0, 37.0, 30.0, 44.0, 27.0, 32.0, 23.0, 18.0, 16.0, 13.0, 16.0, 6.0, 7.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.554443359375, -6.31201171875, -6.069580078125, -5.8271484375, -5.584716796875, -5.34228515625, -5.099853515625, -4.857421875, -4.614990234375, -4.37255859375, -4.130126953125, -3.8876953125, -3.645263671875, -3.40283203125, -3.160400390625, -2.91796875, -2.675537109375, -2.43310546875, -2.190673828125, -1.9482421875, -1.705810546875, -1.46337890625, -1.220947265625, -0.978515625, -0.736083984375, -0.49365234375, -0.251220703125, -0.0087890625, 0.233642578125, 0.47607421875, 0.718505859375, 0.9609375, 1.203369140625, 1.44580078125, 1.688232421875, 1.9306640625, 2.173095703125, 2.41552734375, 2.657958984375, 2.900390625, 3.142822265625, 3.38525390625, 3.627685546875, 3.8701171875, 4.112548828125, 4.35498046875, 4.597412109375, 4.83984375, 5.082275390625, 5.32470703125, 5.567138671875, 5.8095703125, 6.052001953125, 6.29443359375, 6.536865234375, 6.779296875, 7.021728515625, 7.26416015625, 7.506591796875, 7.7490234375, 7.991455078125, 8.23388671875, 8.476318359375, 8.71875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 17.0, 24.0, 33.0, 70.0, 186.0, 646.0, 14710.0, 4169045.0, 8597.0, 568.0, 186.0, 69.0, 25.0, 21.0, 13.0, 12.0, 6.0, 6.0, 4.0, 0.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-83.8125, -81.3798828125, -78.947265625, -76.5146484375, -74.08203125, -71.6494140625, -69.216796875, -66.7841796875, -64.3515625, -61.9189453125, -59.486328125, -57.0537109375, -54.62109375, -52.1884765625, -49.755859375, -47.3232421875, -44.890625, -42.4580078125, -40.025390625, -37.5927734375, -35.16015625, -32.7275390625, -30.294921875, -27.8623046875, -25.4296875, -22.9970703125, -20.564453125, -18.1318359375, -15.69921875, -13.2666015625, -10.833984375, -8.4013671875, -5.96875, -3.5361328125, -1.103515625, 1.3291015625, 3.76171875, 6.1943359375, 8.626953125, 11.0595703125, 13.4921875, 15.9248046875, 18.357421875, 20.7900390625, 23.22265625, 25.6552734375, 28.087890625, 30.5205078125, 32.953125, 35.3857421875, 37.818359375, 40.2509765625, 42.68359375, 45.1162109375, 47.548828125, 49.9814453125, 52.4140625, 54.8466796875, 57.279296875, 59.7119140625, 62.14453125, 64.5771484375, 67.009765625, 69.4423828125, 71.875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 13.0, 10.0, 15.0, 25.0, 57.0, 39.0, 88.0, 118.0, 182.0, 321.0, 562.0, 815.0, 719.0, 396.0, 238.0, 139.0, 107.0, 50.0, 58.0, 31.0, 28.0, 17.0, 9.0, 3.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.2515869140625, -4.108642578125, -3.9656982421875, -3.82275390625, -3.6798095703125, -3.536865234375, -3.3939208984375, -3.2509765625, -3.1080322265625, -2.965087890625, -2.8221435546875, -2.67919921875, -2.5362548828125, -2.393310546875, -2.2503662109375, -2.107421875, -1.9644775390625, -1.821533203125, -1.6785888671875, -1.53564453125, -1.3927001953125, -1.249755859375, -1.1068115234375, -0.9638671875, -0.8209228515625, -0.677978515625, -0.5350341796875, -0.39208984375, -0.2491455078125, -0.106201171875, 0.0367431640625, 0.1796875, 0.3226318359375, 0.465576171875, 0.6085205078125, 0.75146484375, 0.8944091796875, 1.037353515625, 1.1802978515625, 1.3232421875, 1.4661865234375, 1.609130859375, 1.7520751953125, 1.89501953125, 2.0379638671875, 2.180908203125, 2.3238525390625, 2.466796875, 2.6097412109375, 2.752685546875, 2.8956298828125, 3.03857421875, 3.1815185546875, 3.324462890625, 3.4674072265625, 3.6103515625, 3.7532958984375, 3.896240234375, 4.0391845703125, 4.18212890625, 4.3250732421875, 4.468017578125, 4.6109619140625, 4.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 15.0, 23.0, 23.0, 24.0, 49.0, 42.0, 51.0, 65.0, 87.0, 93.0, 80.0, 79.0, 77.0, 55.0, 54.0, 39.0, 26.0, 17.0, 23.0, 17.0, 11.0, 13.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.073370933532715, -7.675901412963867, -7.2784318923950195, -6.880961894989014, -6.483492374420166, -6.086022853851318, -5.6885528564453125, -5.291083335876465, -4.893613815307617, -4.4961442947387695, -4.098674774169922, -3.701204776763916, -3.3037352561950684, -2.9062657356262207, -2.508795976638794, -2.111326217651367, -1.7138566970825195, -1.3163870573043823, -0.9189174175262451, -0.5214477777481079, -0.1239781379699707, 0.2734915018081665, 0.6709611415863037, 1.0684309005737305, 1.4659004211425781, 1.8633700609207153, 2.2608397006988525, 2.6583094596862793, 3.055778980255127, 3.4532485008239746, 3.8507182598114014, 4.248188018798828, 4.645656585693359, 5.043126106262207, 5.440595626831055, 5.8380656242370605, 6.235535144805908, 6.633004665374756, 7.030474662780762, 7.427944183349609, 7.825413703918457, 8.222883224487305, 8.620352745056152, 9.017822265625, 9.415292739868164, 9.812762260437012, 10.21023178100586, 10.607701301574707, 11.005170822143555, 11.402640342712402, 11.80010986328125, 12.197579383850098, 12.595048904418945, 12.99251937866211, 13.389988899230957, 13.787458419799805, 14.184927940368652, 14.5823974609375, 14.979866981506348, 15.377336502075195, 15.77480697631836, 16.17227554321289, 16.569746017456055, 16.96721649169922, 17.36468505859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 4.0, 7.0, 9.0, 12.0, 12.0, 11.0, 13.0, 27.0, 30.0, 24.0, 32.0, 31.0, 48.0, 51.0, 37.0, 53.0, 51.0, 47.0, 45.0, 53.0, 43.0, 37.0, 40.0, 45.0, 32.0, 28.0, 21.0, 29.0, 25.0, 20.0, 10.0, 12.0, 15.0, 5.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.543779373168945, -9.275174140930176, -9.00656795501709, -8.73796272277832, -8.469356536865234, -8.200751304626465, -7.932145595550537, -7.663539886474609, -7.394934177398682, -7.126328468322754, -6.857722759246826, -6.589117050170898, -6.320511817932129, -6.051905632019043, -5.783300399780273, -5.514694690704346, -5.246088981628418, -4.97748327255249, -4.7088775634765625, -4.440271854400635, -4.171666145324707, -3.9030606746673584, -3.6344552040100098, -3.365849494934082, -3.0972437858581543, -2.8286380767822266, -2.560032367706299, -2.29142689704895, -2.0228211879730225, -1.7542154788970947, -1.4856098890304565, -1.2170042991638184, -0.9483985900878906, -0.6797929406166077, -0.4111872911453247, -0.14258164167404175, 0.1260240077972412, 0.39462971687316895, 0.6632353067398071, 0.9318408966064453, 1.200446605682373, 1.4690523147583008, 1.737657904624939, 2.006263494491577, 2.274869203567505, 2.5434749126434326, 2.8120803833007812, 3.080686092376709, 3.3492918014526367, 3.6178975105285645, 3.886503219604492, 4.15510892868042, 4.423714637756348, 4.692319869995117, 4.960925579071045, 5.229531288146973, 5.4981369972229, 5.766742706298828, 6.035348415374756, 6.303954124450684, 6.572559356689453, 6.841165542602539, 7.109770774841309, 7.378376483917236, 7.646982192993164]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 6.0, 8.0, 18.0, 33.0, 44.0, 63.0, 132.0, 177.0, 342.0, 672.0, 1211.0, 2879.0, 7302.0, 19405.0, 57460.0, 189373.0, 409608.0, 244149.0, 75370.0, 24311.0, 8977.0, 3651.0, 1627.0, 777.0, 405.0, 215.0, 124.0, 67.0, 41.0, 23.0, 26.0, 12.0, 11.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9453125, -3.80743408203125, -3.6695556640625, -3.53167724609375, -3.393798828125, -3.25592041015625, -3.1180419921875, -2.98016357421875, -2.84228515625, -2.70440673828125, -2.5665283203125, -2.42864990234375, -2.290771484375, -2.15289306640625, -2.0150146484375, -1.87713623046875, -1.7392578125, -1.60137939453125, -1.4635009765625, -1.32562255859375, -1.187744140625, -1.04986572265625, -0.9119873046875, -0.77410888671875, -0.63623046875, -0.49835205078125, -0.3604736328125, -0.22259521484375, -0.084716796875, 0.05316162109375, 0.1910400390625, 0.32891845703125, 0.466796875, 0.60467529296875, 0.7425537109375, 0.88043212890625, 1.018310546875, 1.15618896484375, 1.2940673828125, 1.43194580078125, 1.56982421875, 1.70770263671875, 1.8455810546875, 1.98345947265625, 2.121337890625, 2.25921630859375, 2.3970947265625, 2.53497314453125, 2.6728515625, 2.81072998046875, 2.9486083984375, 3.08648681640625, 3.224365234375, 3.36224365234375, 3.5001220703125, 3.63800048828125, 3.77587890625, 3.91375732421875, 4.0516357421875, 4.18951416015625, 4.327392578125, 4.46527099609375, 4.6031494140625, 4.74102783203125, 4.87890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 11.0, 16.0, 22.0, 28.0, 43.0, 27.0, 33.0, 57.0, 73.0, 67.0, 62.0, 78.0, 71.0, 68.0, 70.0, 56.0, 39.0, 41.0, 31.0, 27.0, 19.0, 10.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-9.5703125, -9.3453369140625, -9.120361328125, -8.8953857421875, -8.67041015625, -8.4454345703125, -8.220458984375, -7.9954833984375, -7.7705078125, -7.5455322265625, -7.320556640625, -7.0955810546875, -6.87060546875, -6.6456298828125, -6.420654296875, -6.1956787109375, -5.970703125, -5.7457275390625, -5.520751953125, -5.2957763671875, -5.07080078125, -4.8458251953125, -4.620849609375, -4.3958740234375, -4.1708984375, -3.9459228515625, -3.720947265625, -3.4959716796875, -3.27099609375, -3.0460205078125, -2.821044921875, -2.5960693359375, -2.37109375, -2.1461181640625, -1.921142578125, -1.6961669921875, -1.47119140625, -1.2462158203125, -1.021240234375, -0.7962646484375, -0.5712890625, -0.3463134765625, -0.121337890625, 0.1036376953125, 0.32861328125, 0.5535888671875, 0.778564453125, 1.0035400390625, 1.228515625, 1.4534912109375, 1.678466796875, 1.9034423828125, 2.12841796875, 2.3533935546875, 2.578369140625, 2.8033447265625, 3.0283203125, 3.2532958984375, 3.478271484375, 3.7032470703125, 3.92822265625, 4.1531982421875, 4.378173828125, 4.6031494140625, 4.828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 10.0, 18.0, 18.0, 36.0, 43.0, 57.0, 97.0, 161.0, 236.0, 440.0, 767.0, 1468.0, 2849.0, 6490.0, 15294.0, 40138.0, 114079.0, 289434.0, 336983.0, 151355.0, 53274.0, 19697.0, 8098.0, 3620.0, 1782.0, 874.0, 437.0, 274.0, 169.0, 115.0, 71.0, 57.0, 29.0, 19.0, 17.0, 10.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.953338623046875, -2.85198974609375, -2.750640869140625, -2.6492919921875, -2.547943115234375, -2.44659423828125, -2.345245361328125, -2.243896484375, -2.142547607421875, -2.04119873046875, -1.939849853515625, -1.8385009765625, -1.737152099609375, -1.63580322265625, -1.534454345703125, -1.43310546875, -1.331756591796875, -1.23040771484375, -1.129058837890625, -1.0277099609375, -0.926361083984375, -0.82501220703125, -0.723663330078125, -0.622314453125, -0.520965576171875, -0.41961669921875, -0.318267822265625, -0.2169189453125, -0.115570068359375, -0.01422119140625, 0.087127685546875, 0.1884765625, 0.289825439453125, 0.39117431640625, 0.492523193359375, 0.5938720703125, 0.695220947265625, 0.79656982421875, 0.897918701171875, 0.999267578125, 1.100616455078125, 1.20196533203125, 1.303314208984375, 1.4046630859375, 1.506011962890625, 1.60736083984375, 1.708709716796875, 1.81005859375, 1.911407470703125, 2.01275634765625, 2.114105224609375, 2.2154541015625, 2.316802978515625, 2.41815185546875, 2.519500732421875, 2.620849609375, 2.722198486328125, 2.82354736328125, 2.924896240234375, 3.0262451171875, 3.127593994140625, 3.22894287109375, 3.330291748046875, 3.431640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 10.0, 16.0, 16.0, 10.0, 20.0, 21.0, 21.0, 22.0, 33.0, 35.0, 35.0, 33.0, 43.0, 46.0, 37.0, 51.0, 47.0, 39.0, 44.0, 35.0, 53.0, 47.0, 54.0, 37.0, 33.0, 25.0, 15.0, 13.0, 18.0, 13.0, 23.0, 14.0, 9.0, 9.0, 5.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3515625, -9.052001953125, -8.75244140625, -8.452880859375, -8.1533203125, -7.853759765625, -7.55419921875, -7.254638671875, -6.955078125, -6.655517578125, -6.35595703125, -6.056396484375, -5.7568359375, -5.457275390625, -5.15771484375, -4.858154296875, -4.55859375, -4.259033203125, -3.95947265625, -3.659912109375, -3.3603515625, -3.060791015625, -2.76123046875, -2.461669921875, -2.162109375, -1.862548828125, -1.56298828125, -1.263427734375, -0.9638671875, -0.664306640625, -0.36474609375, -0.065185546875, 0.234375, 0.533935546875, 0.83349609375, 1.133056640625, 1.4326171875, 1.732177734375, 2.03173828125, 2.331298828125, 2.630859375, 2.930419921875, 3.22998046875, 3.529541015625, 3.8291015625, 4.128662109375, 4.42822265625, 4.727783203125, 5.02734375, 5.326904296875, 5.62646484375, 5.926025390625, 6.2255859375, 6.525146484375, 6.82470703125, 7.124267578125, 7.423828125, 7.723388671875, 8.02294921875, 8.322509765625, 8.6220703125, 8.921630859375, 9.22119140625, 9.520751953125, 9.8203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 22.0, 24.0, 26.0, 61.0, 84.0, 133.0, 222.0, 360.0, 632.0, 1187.0, 2422.0, 5554.0, 13747.0, 40821.0, 137787.0, 379564.0, 314916.0, 100558.0, 30910.0, 10667.0, 4399.0, 2019.0, 1048.0, 542.0, 308.0, 177.0, 127.0, 58.0, 55.0, 25.0, 17.0, 20.0, 9.0, 14.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2393035888671875, -1.196380615234375, -1.1534576416015625, -1.11053466796875, -1.0676116943359375, -1.024688720703125, -0.9817657470703125, -0.9388427734375, -0.8959197998046875, -0.852996826171875, -0.8100738525390625, -0.76715087890625, -0.7242279052734375, -0.681304931640625, -0.6383819580078125, -0.595458984375, -0.5525360107421875, -0.509613037109375, -0.4666900634765625, -0.42376708984375, -0.3808441162109375, -0.337921142578125, -0.2949981689453125, -0.2520751953125, -0.2091522216796875, -0.166229248046875, -0.1233062744140625, -0.08038330078125, -0.0374603271484375, 0.005462646484375, 0.0483856201171875, 0.09130859375, 0.1342315673828125, 0.177154541015625, 0.2200775146484375, 0.26300048828125, 0.3059234619140625, 0.348846435546875, 0.3917694091796875, 0.4346923828125, 0.4776153564453125, 0.520538330078125, 0.5634613037109375, 0.60638427734375, 0.6493072509765625, 0.692230224609375, 0.7351531982421875, 0.778076171875, 0.8209991455078125, 0.863922119140625, 0.9068450927734375, 0.94976806640625, 0.9926910400390625, 1.035614013671875, 1.0785369873046875, 1.1214599609375, 1.1643829345703125, 1.207305908203125, 1.2502288818359375, 1.29315185546875, 1.3360748291015625, 1.378997802734375, 1.4219207763671875, 1.46484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 7.0, 14.0, 17.0, 14.0, 16.0, 25.0, 25.0, 33.0, 48.0, 45.0, 62.0, 62.0, 61.0, 72.0, 55.0, 53.0, 54.0, 49.0, 46.0, 40.0, 29.0, 28.0, 28.0, 17.0, 15.0, 13.0, 13.0, 8.0, 8.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0006613731384277344, -0.000642724335193634, -0.0006240755319595337, -0.0006054267287254333, -0.000586777925491333, -0.0005681291222572327, -0.0005494803190231323, -0.000530831515789032, -0.0005121827125549316, -0.0004935339093208313, -0.00047488510608673096, -0.0004562363028526306, -0.0004375874996185303, -0.00041893869638442993, -0.0004002898931503296, -0.00038164108991622925, -0.0003629922866821289, -0.00034434348344802856, -0.0003256946802139282, -0.0003070458769798279, -0.00028839707374572754, -0.0002697482705116272, -0.00025109946727752686, -0.00023245066404342651, -0.00021380186080932617, -0.00019515305757522583, -0.0001765042543411255, -0.00015785545110702515, -0.0001392066478729248, -0.00012055784463882446, -0.00010190904140472412, -8.326023817062378e-05, -6.461143493652344e-05, -4.5962631702423096e-05, -2.7313828468322754e-05, -8.665025234222412e-06, 9.98377799987793e-06, 2.863258123397827e-05, 4.728138446807861e-05, 6.593018770217896e-05, 8.45789909362793e-05, 0.00010322779417037964, 0.00012187659740447998, 0.00014052540063858032, 0.00015917420387268066, 0.000177823007106781, 0.00019647181034088135, 0.0002151206135749817, 0.00023376941680908203, 0.0002524182200431824, 0.0002710670232772827, 0.00028971582651138306, 0.0003083646297454834, 0.00032701343297958374, 0.0003456622362136841, 0.0003643110394477844, 0.00038295984268188477, 0.0004016086459159851, 0.00042025744915008545, 0.0004389062523841858, 0.00045755505561828613, 0.0004762038588523865, 0.0004948526620864868, 0.0005135014653205872, 0.0005321502685546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 2.0, 9.0, 8.0, 12.0, 17.0, 19.0, 27.0, 36.0, 58.0, 104.0, 137.0, 241.0, 389.0, 855.0, 1667.0, 3760.0, 9211.0, 26434.0, 86762.0, 270397.0, 393501.0, 174045.0, 52484.0, 16608.0, 6226.0, 2729.0, 1268.0, 607.0, 369.0, 207.0, 124.0, 64.0, 53.0, 25.0, 28.0, 20.0, 14.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.349609375, -1.3078155517578125, -1.266021728515625, -1.2242279052734375, -1.18243408203125, -1.1406402587890625, -1.098846435546875, -1.0570526123046875, -1.0152587890625, -0.9734649658203125, -0.931671142578125, -0.8898773193359375, -0.84808349609375, -0.8062896728515625, -0.764495849609375, -0.7227020263671875, -0.680908203125, -0.6391143798828125, -0.597320556640625, -0.5555267333984375, -0.51373291015625, -0.4719390869140625, -0.430145263671875, -0.3883514404296875, -0.3465576171875, -0.3047637939453125, -0.262969970703125, -0.2211761474609375, -0.17938232421875, -0.1375885009765625, -0.095794677734375, -0.0540008544921875, -0.01220703125, 0.0295867919921875, 0.071380615234375, 0.1131744384765625, 0.15496826171875, 0.1967620849609375, 0.238555908203125, 0.2803497314453125, 0.3221435546875, 0.3639373779296875, 0.405731201171875, 0.4475250244140625, 0.48931884765625, 0.5311126708984375, 0.572906494140625, 0.6147003173828125, 0.656494140625, 0.6982879638671875, 0.740081787109375, 0.7818756103515625, 0.82366943359375, 0.8654632568359375, 0.907257080078125, 0.9490509033203125, 0.9908447265625, 1.0326385498046875, 1.074432373046875, 1.1162261962890625, 1.15802001953125, 1.1998138427734375, 1.241607666015625, 1.2834014892578125, 1.3251953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 7.0, 6.0, 12.0, 22.0, 12.0, 26.0, 22.0, 27.0, 23.0, 46.0, 27.0, 38.0, 70.0, 52.0, 59.0, 56.0, 57.0, 70.0, 53.0, 54.0, 37.0, 45.0, 26.0, 25.0, 16.0, 24.0, 18.0, 18.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.304931640625, -0.2956962585449219, -0.28646087646484375, -0.2772254943847656, -0.2679901123046875, -0.2587547302246094, -0.24951934814453125, -0.24028396606445312, -0.231048583984375, -0.22181320190429688, -0.21257781982421875, -0.20334243774414062, -0.1941070556640625, -0.18487167358398438, -0.17563629150390625, -0.16640090942382812, -0.15716552734375, -0.14793014526367188, -0.13869476318359375, -0.12945938110351562, -0.1202239990234375, -0.11098861694335938, -0.10175323486328125, -0.09251785278320312, -0.083282470703125, -0.07404708862304688, -0.06481170654296875, -0.055576324462890625, -0.0463409423828125, -0.037105560302734375, -0.02787017822265625, -0.018634796142578125, -0.0093994140625, -0.000164031982421875, 0.00907135009765625, 0.018306732177734375, 0.0275421142578125, 0.036777496337890625, 0.04601287841796875, 0.055248260498046875, 0.064483642578125, 0.07371902465820312, 0.08295440673828125, 0.09218978881835938, 0.1014251708984375, 0.11066055297851562, 0.11989593505859375, 0.12913131713867188, 0.13836669921875, 0.14760208129882812, 0.15683746337890625, 0.16607284545898438, 0.1753082275390625, 0.18454360961914062, 0.19377899169921875, 0.20301437377929688, 0.212249755859375, 0.22148513793945312, 0.23072052001953125, 0.23995590209960938, 0.2491912841796875, 0.2584266662597656, 0.26766204833984375, 0.2768974304199219, 0.2861328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 7.0, 13.0, 20.0, 18.0, 44.0, 58.0, 61.0, 75.0, 95.0, 100.0, 101.0, 78.0, 83.0, 55.0, 45.0, 25.0, 23.0, 24.0, 19.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.933866024017334, -4.675630569458008, -4.417394638061523, -4.159159183502197, -3.900923728942871, -3.642688274383545, -3.3844525814056396, -3.1262168884277344, -2.867981433868408, -2.609745979309082, -2.3515102863311768, -2.0932745933532715, -1.8350391387939453, -1.5768035650253296, -1.3185679912567139, -1.0603324174880981, -0.8020968437194824, -0.5438612699508667, -0.285625696182251, -0.027390122413635254, 0.23084545135498047, 0.4890810251235962, 0.7473165988922119, 1.0055521726608276, 1.2637877464294434, 1.522023320198059, 1.7802588939666748, 2.03849458694458, 2.2967300415039062, 2.5549654960632324, 2.8132011890411377, 3.071436882019043, 3.329671859741211, 3.587907314300537, 3.8461430072784424, 4.104378700256348, 4.362614154815674, 4.620849609375, 4.879085540771484, 5.1373209953308105, 5.395556449890137, 5.653791904449463, 5.912027359008789, 6.170263290405273, 6.4284987449646, 6.686734199523926, 6.94497013092041, 7.203205585479736, 7.4614410400390625, 7.719676494598389, 7.977911949157715, 8.2361478805542, 8.494382858276367, 8.752618789672852, 9.010854721069336, 9.269089698791504, 9.527325630187988, 9.785561561584473, 10.04379653930664, 10.302032470703125, 10.56026840209961, 10.818503379821777, 11.076739311218262, 11.33497428894043, 11.593210220336914]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 3.0, 10.0, 13.0, 18.0, 20.0, 23.0, 36.0, 23.0, 48.0, 38.0, 55.0, 65.0, 53.0, 52.0, 59.0, 56.0, 68.0, 47.0, 49.0, 36.0, 41.0, 41.0, 23.0, 25.0, 16.0, 12.0, 14.0, 12.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.4476823806762695, -6.265778064727783, -6.083873748779297, -5.901969909667969, -5.720065593719482, -5.538161277770996, -5.35625696182251, -5.174352645874023, -4.992448806762695, -4.810544490814209, -4.628640174865723, -4.4467363357543945, -4.264832019805908, -4.082927703857422, -3.9010233879089355, -3.719119071960449, -3.537214756011963, -3.3553104400634766, -3.1734063625335693, -2.991502046585083, -2.809597969055176, -2.6276936531066895, -2.445789337158203, -2.263885021209717, -2.0819809436798096, -1.9000767469406128, -1.718172550201416, -1.5362682342529297, -1.354364037513733, -1.1724598407745361, -0.9905555248260498, -0.808651328086853, -0.626746654510498, -0.4448424279689789, -0.2629382014274597, -0.08103394508361816, 0.10087025165557861, 0.2827744483947754, 0.4646787643432617, 0.6465829610824585, 0.8284871578216553, 1.010391354560852, 1.1922955513000488, 1.3741998672485352, 1.556104063987732, 1.7380082607269287, 1.919912576675415, 2.1018166542053223, 2.2837209701538086, 2.465625286102295, 2.647529363632202, 2.8294336795806885, 3.0113377571105957, 3.193242073059082, 3.3751463890075684, 3.5570507049560547, 3.738954782485962, 3.9208590984344482, 4.1027631759643555, 4.284667491912842, 4.466571807861328, 4.648475646972656, 4.830380439758301, 5.012284278869629, 5.194188594818115]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 15.0, 24.0, 60.0, 76.0, 131.0, 235.0, 498.0, 1079.0, 2551.0, 6874.0, 21585.0, 90725.0, 606178.0, 252253.0, 45816.0, 12694.0, 4393.0, 1764.0, 781.0, 391.0, 183.0, 106.0, 53.0, 24.0, 21.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -9.013671875, -8.76171875, -8.509765625, -8.2578125, -8.005859375, -7.75390625, -7.501953125, -7.25, -6.998046875, -6.74609375, -6.494140625, -6.2421875, -5.990234375, -5.73828125, -5.486328125, -5.234375, -4.982421875, -4.73046875, -4.478515625, -4.2265625, -3.974609375, -3.72265625, -3.470703125, -3.21875, -2.966796875, -2.71484375, -2.462890625, -2.2109375, -1.958984375, -1.70703125, -1.455078125, -1.203125, -0.951171875, -0.69921875, -0.447265625, -0.1953125, 0.056640625, 0.30859375, 0.560546875, 0.8125, 1.064453125, 1.31640625, 1.568359375, 1.8203125, 2.072265625, 2.32421875, 2.576171875, 2.828125, 3.080078125, 3.33203125, 3.583984375, 3.8359375, 4.087890625, 4.33984375, 4.591796875, 4.84375, 5.095703125, 5.34765625, 5.599609375, 5.8515625, 6.103515625, 6.35546875, 6.607421875, 6.859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 7.0, 12.0, 28.0, 16.0, 26.0, 43.0, 34.0, 43.0, 32.0, 52.0, 56.0, 57.0, 59.0, 61.0, 51.0, 58.0, 45.0, 51.0, 47.0, 35.0, 32.0, 27.0, 14.0, 23.0, 16.0, 11.0, 7.0, 9.0, 3.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.41455078125, -11.0244140625, -10.63427734375, -10.244140625, -9.85400390625, -9.4638671875, -9.07373046875, -8.68359375, -8.29345703125, -7.9033203125, -7.51318359375, -7.123046875, -6.73291015625, -6.3427734375, -5.95263671875, -5.5625, -5.17236328125, -4.7822265625, -4.39208984375, -4.001953125, -3.61181640625, -3.2216796875, -2.83154296875, -2.44140625, -2.05126953125, -1.6611328125, -1.27099609375, -0.880859375, -0.49072265625, -0.1005859375, 0.28955078125, 0.6796875, 1.06982421875, 1.4599609375, 1.85009765625, 2.240234375, 2.63037109375, 3.0205078125, 3.41064453125, 3.80078125, 4.19091796875, 4.5810546875, 4.97119140625, 5.361328125, 5.75146484375, 6.1416015625, 6.53173828125, 6.921875, 7.31201171875, 7.7021484375, 8.09228515625, 8.482421875, 8.87255859375, 9.2626953125, 9.65283203125, 10.04296875, 10.43310546875, 10.8232421875, 11.21337890625, 11.603515625, 11.99365234375, 12.3837890625, 12.77392578125, 13.1640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 9.0, 11.0, 11.0, 17.0, 9.0, 26.0, 33.0, 31.0, 39.0, 49.0, 51.0, 90.0, 363.0, 89971.0, 956387.0, 1014.0, 104.0, 72.0, 51.0, 59.0, 30.0, 30.0, 16.0, 15.0, 18.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -65.54736328125, -63.7822265625, -62.01708984375, -60.251953125, -58.48681640625, -56.7216796875, -54.95654296875, -53.19140625, -51.42626953125, -49.6611328125, -47.89599609375, -46.130859375, -44.36572265625, -42.6005859375, -40.83544921875, -39.0703125, -37.30517578125, -35.5400390625, -33.77490234375, -32.009765625, -30.24462890625, -28.4794921875, -26.71435546875, -24.94921875, -23.18408203125, -21.4189453125, -19.65380859375, -17.888671875, -16.12353515625, -14.3583984375, -12.59326171875, -10.828125, -9.06298828125, -7.2978515625, -5.53271484375, -3.767578125, -2.00244140625, -0.2373046875, 1.52783203125, 3.29296875, 5.05810546875, 6.8232421875, 8.58837890625, 10.353515625, 12.11865234375, 13.8837890625, 15.64892578125, 17.4140625, 19.17919921875, 20.9443359375, 22.70947265625, 24.474609375, 26.23974609375, 28.0048828125, 29.77001953125, 31.53515625, 33.30029296875, 35.0654296875, 36.83056640625, 38.595703125, 40.36083984375, 42.1259765625, 43.89111328125, 45.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 12.0, 11.0, 11.0, 17.0, 24.0, 30.0, 45.0, 28.0, 58.0, 51.0, 71.0, 65.0, 59.0, 66.0, 57.0, 50.0, 59.0, 56.0, 58.0, 36.0, 28.0, 25.0, 15.0, 16.0, 14.0, 4.0, 8.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.140625, -19.63818359375, -19.1357421875, -18.63330078125, -18.130859375, -17.62841796875, -17.1259765625, -16.62353515625, -16.12109375, -15.61865234375, -15.1162109375, -14.61376953125, -14.111328125, -13.60888671875, -13.1064453125, -12.60400390625, -12.1015625, -11.59912109375, -11.0966796875, -10.59423828125, -10.091796875, -9.58935546875, -9.0869140625, -8.58447265625, -8.08203125, -7.57958984375, -7.0771484375, -6.57470703125, -6.072265625, -5.56982421875, -5.0673828125, -4.56494140625, -4.0625, -3.56005859375, -3.0576171875, -2.55517578125, -2.052734375, -1.55029296875, -1.0478515625, -0.54541015625, -0.04296875, 0.45947265625, 0.9619140625, 1.46435546875, 1.966796875, 2.46923828125, 2.9716796875, 3.47412109375, 3.9765625, 4.47900390625, 4.9814453125, 5.48388671875, 5.986328125, 6.48876953125, 6.9912109375, 7.49365234375, 7.99609375, 8.49853515625, 9.0009765625, 9.50341796875, 10.005859375, 10.50830078125, 11.0107421875, 11.51318359375, 12.015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 10.0, 11.0, 22.0, 15.0, 26.0, 34.0, 51.0, 67.0, 116.0, 191.0, 361.0, 597.0, 1371.0, 3260.0, 9154.0, 32447.0, 166301.0, 708179.0, 93960.0, 21096.0, 6447.0, 2533.0, 1018.0, 536.0, 281.0, 158.0, 105.0, 64.0, 40.0, 27.0, 14.0, 18.0, 9.0, 6.0, 4.0, 6.0, 7.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.4532470703125, -2.363525390625, -2.2738037109375, -2.18408203125, -2.0943603515625, -2.004638671875, -1.9149169921875, -1.8251953125, -1.7354736328125, -1.645751953125, -1.5560302734375, -1.46630859375, -1.3765869140625, -1.286865234375, -1.1971435546875, -1.107421875, -1.0177001953125, -0.927978515625, -0.8382568359375, -0.74853515625, -0.6588134765625, -0.569091796875, -0.4793701171875, -0.3896484375, -0.2999267578125, -0.210205078125, -0.1204833984375, -0.03076171875, 0.0589599609375, 0.148681640625, 0.2384033203125, 0.328125, 0.4178466796875, 0.507568359375, 0.5972900390625, 0.68701171875, 0.7767333984375, 0.866455078125, 0.9561767578125, 1.0458984375, 1.1356201171875, 1.225341796875, 1.3150634765625, 1.40478515625, 1.4945068359375, 1.584228515625, 1.6739501953125, 1.763671875, 1.8533935546875, 1.943115234375, 2.0328369140625, 2.12255859375, 2.2122802734375, 2.302001953125, 2.3917236328125, 2.4814453125, 2.5711669921875, 2.660888671875, 2.7506103515625, 2.84033203125, 2.9300537109375, 3.019775390625, 3.1094970703125, 3.19921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 13.0, 15.0, 25.0, 20.0, 38.0, 56.0, 100.0, 192.0, 253.0, 94.0, 55.0, 37.0, 33.0, 23.0, 11.0, 7.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038909912109375, -0.0003706887364387512, -0.00035227835178375244, -0.00033386796712875366, -0.0003154575824737549, -0.0002970471978187561, -0.0002786368131637573, -0.00026022642850875854, -0.00024181604385375977, -0.00022340565919876099, -0.0002049952745437622, -0.00018658488988876343, -0.00016817450523376465, -0.00014976412057876587, -0.0001313537359237671, -0.00011294335126876831, -9.453296661376953e-05, -7.612258195877075e-05, -5.771219730377197e-05, -3.930181264877319e-05, -2.0891427993774414e-05, -2.4810433387756348e-06, 1.5929341316223145e-05, 3.4339725971221924e-05, 5.27501106262207e-05, 7.116049528121948e-05, 8.957087993621826e-05, 0.00010798126459121704, 0.00012639164924621582, 0.0001448020339012146, 0.00016321241855621338, 0.00018162280321121216, 0.00020003318786621094, 0.00021844357252120972, 0.0002368539571762085, 0.0002552643418312073, 0.00027367472648620605, 0.00029208511114120483, 0.0003104954957962036, 0.0003289058804512024, 0.00034731626510620117, 0.00036572664976119995, 0.00038413703441619873, 0.0004025474190711975, 0.0004209578037261963, 0.00043936818838119507, 0.00045777857303619385, 0.0004761889576911926, 0.0004945993423461914, 0.0005130097270011902, 0.000531420111656189, 0.0005498304963111877, 0.0005682408809661865, 0.0005866512656211853, 0.0006050616502761841, 0.0006234720349311829, 0.0006418824195861816, 0.0006602928042411804, 0.0006787031888961792, 0.000697113573551178, 0.0007155239582061768, 0.0007339343428611755, 0.0007523447275161743, 0.0007707551121711731, 0.0007891654968261719]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 4.0, 9.0, 12.0, 12.0, 32.0, 46.0, 82.0, 142.0, 262.0, 486.0, 1034.0, 2343.0, 5939.0, 19098.0, 83532.0, 697340.0, 187381.0, 34492.0, 9709.0, 3538.0, 1506.0, 705.0, 371.0, 187.0, 119.0, 68.0, 33.0, 20.0, 21.0, 11.0, 7.0, 4.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.564971923828125, -2.47564697265625, -2.386322021484375, -2.2969970703125, -2.207672119140625, -2.11834716796875, -2.029022216796875, -1.939697265625, -1.850372314453125, -1.76104736328125, -1.671722412109375, -1.5823974609375, -1.493072509765625, -1.40374755859375, -1.314422607421875, -1.22509765625, -1.135772705078125, -1.04644775390625, -0.957122802734375, -0.8677978515625, -0.778472900390625, -0.68914794921875, -0.599822998046875, -0.510498046875, -0.421173095703125, -0.33184814453125, -0.242523193359375, -0.1531982421875, -0.063873291015625, 0.02545166015625, 0.114776611328125, 0.2041015625, 0.293426513671875, 0.38275146484375, 0.472076416015625, 0.5614013671875, 0.650726318359375, 0.74005126953125, 0.829376220703125, 0.918701171875, 1.008026123046875, 1.09735107421875, 1.186676025390625, 1.2760009765625, 1.365325927734375, 1.45465087890625, 1.543975830078125, 1.63330078125, 1.722625732421875, 1.81195068359375, 1.901275634765625, 1.9906005859375, 2.079925537109375, 2.16925048828125, 2.258575439453125, 2.347900390625, 2.437225341796875, 2.52655029296875, 2.615875244140625, 2.7052001953125, 2.794525146484375, 2.88385009765625, 2.973175048828125, 3.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 7.0, 17.0, 15.0, 21.0, 27.0, 38.0, 38.0, 60.0, 80.0, 272.0, 97.0, 57.0, 44.0, 42.0, 29.0, 27.0, 22.0, 25.0, 14.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71142578125, -0.6751480102539062, -0.6388702392578125, -0.6025924682617188, -0.566314697265625, -0.5300369262695312, -0.4937591552734375, -0.45748138427734375, -0.42120361328125, -0.38492584228515625, -0.3486480712890625, -0.31237030029296875, -0.276092529296875, -0.23981475830078125, -0.2035369873046875, -0.16725921630859375, -0.1309814453125, -0.09470367431640625, -0.0584259033203125, -0.02214813232421875, 0.014129638671875, 0.05040740966796875, 0.0866851806640625, 0.12296295166015625, 0.15924072265625, 0.19551849365234375, 0.2317962646484375, 0.26807403564453125, 0.304351806640625, 0.34062957763671875, 0.3769073486328125, 0.41318511962890625, 0.449462890625, 0.48574066162109375, 0.5220184326171875, 0.5582962036132812, 0.594573974609375, 0.6308517456054688, 0.6671295166015625, 0.7034072875976562, 0.73968505859375, 0.7759628295898438, 0.8122406005859375, 0.8485183715820312, 0.884796142578125, 0.9210739135742188, 0.9573516845703125, 0.9936294555664062, 1.0299072265625, 1.0661849975585938, 1.1024627685546875, 1.1387405395507812, 1.175018310546875, 1.2112960815429688, 1.2475738525390625, 1.2838516235351562, 1.32012939453125, 1.3564071655273438, 1.3926849365234375, 1.4289627075195312, 1.465240478515625, 1.5015182495117188, 1.5377960205078125, 1.5740737915039062, 1.6103515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 22.0, 99.0, 316.0, 367.0, 147.0, 47.0, 7.0, 7.0, 1.0, 0.0, 1.0], "bins": [-125.51412200927734, -123.28372955322266, -121.05333709716797, -118.82294464111328, -116.59255981445312, -114.36216735839844, -112.13177490234375, -109.90138244628906, -107.67098999023438, -105.44059753417969, -103.210205078125, -100.97981262207031, -98.74942016601562, -96.51903533935547, -94.28864288330078, -92.0582504272461, -89.8278579711914, -87.59746551513672, -85.36707305908203, -83.13668060302734, -80.90629577636719, -78.6759033203125, -76.44551086425781, -74.21511840820312, -71.98472595214844, -69.75433349609375, -67.52394104003906, -65.29354858398438, -63.06315994262695, -60.832767486572266, -58.602378845214844, -56.371986389160156, -54.14158630371094, -51.91119384765625, -49.68080139160156, -47.45041275024414, -45.22002029418945, -42.989627838134766, -40.759239196777344, -38.528846740722656, -36.29845428466797, -34.06806182861328, -31.837671279907227, -29.607280731201172, -27.376888275146484, -25.146495819091797, -22.916105270385742, -20.685714721679688, -18.455324172973633, -16.224933624267578, -13.99454116821289, -11.76414966583252, -9.533758163452148, -7.303366661071777, -5.072975158691406, -2.842583656311035, -0.6121921539306641, 1.618199348449707, 3.848590850830078, 6.078982353210449, 8.30937385559082, 10.539765357971191, 12.770156860351562, 15.000548362731934, 17.230939865112305]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 10.0, 9.0, 17.0, 14.0, 18.0, 23.0, 22.0, 34.0, 24.0, 38.0, 31.0, 42.0, 46.0, 36.0, 41.0, 43.0, 54.0, 50.0, 44.0, 43.0, 39.0, 47.0, 39.0, 31.0, 37.0, 21.0, 22.0, 23.0, 12.0, 14.0, 15.0, 8.0, 3.0, 9.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.739897727966309, -13.230113983154297, -12.720330238342285, -12.210546493530273, -11.700762748718262, -11.19097900390625, -10.681195259094238, -10.171411514282227, -9.661627769470215, -9.151844024658203, -8.642060279846191, -8.13227653503418, -7.622492790222168, -7.112709045410156, -6.6029253005981445, -6.093141555786133, -5.583357810974121, -5.073574066162109, -4.563790321350098, -4.054006576538086, -3.544222831726074, -3.0344390869140625, -2.524655342102051, -2.014871597290039, -1.5050878524780273, -0.9953041076660156, -0.4855203628540039, 0.024263381958007812, 0.5340471267700195, 1.0438308715820312, 1.553614616394043, 2.0633983612060547, 2.57318115234375, 3.0829648971557617, 3.5927486419677734, 4.102532386779785, 4.612316131591797, 5.122099876403809, 5.63188362121582, 6.141667366027832, 6.651451110839844, 7.1612348556518555, 7.671018600463867, 8.180802345275879, 8.69058609008789, 9.200369834899902, 9.710153579711914, 10.219937324523926, 10.729721069335938, 11.23950481414795, 11.749288558959961, 12.259072303771973, 12.768856048583984, 13.278639793395996, 13.788423538208008, 14.29820728302002, 14.807991027832031, 15.317774772644043, 15.827558517456055, 16.33734130859375, 16.847126007080078, 17.356910705566406, 17.8666934967041, 18.376476287841797, 18.886260986328125]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 7.0, 18.0, 20.0, 23.0, 27.0, 70.0, 125.0, 204.0, 399.0, 754.0, 1791.0, 4335.0, 13295.0, 61693.0, 688070.0, 2982350.0, 384360.0, 40644.0, 9716.0, 3384.0, 1424.0, 680.0, 376.0, 192.0, 112.0, 69.0, 29.0, 22.0, 16.0, 23.0, 13.0, 15.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.364990234375, -12.92529296875, -12.485595703125, -12.0458984375, -11.606201171875, -11.16650390625, -10.726806640625, -10.287109375, -9.847412109375, -9.40771484375, -8.968017578125, -8.5283203125, -8.088623046875, -7.64892578125, -7.209228515625, -6.76953125, -6.329833984375, -5.89013671875, -5.450439453125, -5.0107421875, -4.571044921875, -4.13134765625, -3.691650390625, -3.251953125, -2.812255859375, -2.37255859375, -1.932861328125, -1.4931640625, -1.053466796875, -0.61376953125, -0.174072265625, 0.265625, 0.705322265625, 1.14501953125, 1.584716796875, 2.0244140625, 2.464111328125, 2.90380859375, 3.343505859375, 3.783203125, 4.222900390625, 4.66259765625, 5.102294921875, 5.5419921875, 5.981689453125, 6.42138671875, 6.861083984375, 7.30078125, 7.740478515625, 8.18017578125, 8.619873046875, 9.0595703125, 9.499267578125, 9.93896484375, 10.378662109375, 10.818359375, 11.258056640625, 11.69775390625, 12.137451171875, 12.5771484375, 13.016845703125, 13.45654296875, 13.896240234375, 14.3359375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 7.0, 3.0, 16.0, 16.0, 21.0, 12.0, 30.0, 35.0, 36.0, 34.0, 50.0, 61.0, 63.0, 61.0, 51.0, 58.0, 38.0, 57.0, 46.0, 58.0, 45.0, 30.0, 41.0, 21.0, 16.0, 22.0, 19.0, 9.0, 9.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.12017822265625, -5.8848876953125, -5.64959716796875, -5.414306640625, -5.17901611328125, -4.9437255859375, -4.70843505859375, -4.47314453125, -4.23785400390625, -4.0025634765625, -3.76727294921875, -3.531982421875, -3.29669189453125, -3.0614013671875, -2.82611083984375, -2.5908203125, -2.35552978515625, -2.1202392578125, -1.88494873046875, -1.649658203125, -1.41436767578125, -1.1790771484375, -0.94378662109375, -0.70849609375, -0.47320556640625, -0.2379150390625, -0.00262451171875, 0.232666015625, 0.46795654296875, 0.7032470703125, 0.93853759765625, 1.173828125, 1.40911865234375, 1.6444091796875, 1.87969970703125, 2.114990234375, 2.35028076171875, 2.5855712890625, 2.82086181640625, 3.05615234375, 3.29144287109375, 3.5267333984375, 3.76202392578125, 3.997314453125, 4.23260498046875, 4.4678955078125, 4.70318603515625, 4.9384765625, 5.17376708984375, 5.4090576171875, 5.64434814453125, 5.879638671875, 6.11492919921875, 6.3502197265625, 6.58551025390625, 6.82080078125, 7.05609130859375, 7.2913818359375, 7.52667236328125, 7.761962890625, 7.99725341796875, 8.2325439453125, 8.46783447265625, 8.703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 14.0, 26.0, 53.0, 108.0, 285.0, 1851.0, 177491.0, 4005482.0, 8052.0, 555.0, 165.0, 64.0, 41.0, 27.0, 12.0, 13.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-50.9375, -49.4912109375, -48.044921875, -46.5986328125, -45.15234375, -43.7060546875, -42.259765625, -40.8134765625, -39.3671875, -37.9208984375, -36.474609375, -35.0283203125, -33.58203125, -32.1357421875, -30.689453125, -29.2431640625, -27.796875, -26.3505859375, -24.904296875, -23.4580078125, -22.01171875, -20.5654296875, -19.119140625, -17.6728515625, -16.2265625, -14.7802734375, -13.333984375, -11.8876953125, -10.44140625, -8.9951171875, -7.548828125, -6.1025390625, -4.65625, -3.2099609375, -1.763671875, -0.3173828125, 1.12890625, 2.5751953125, 4.021484375, 5.4677734375, 6.9140625, 8.3603515625, 9.806640625, 11.2529296875, 12.69921875, 14.1455078125, 15.591796875, 17.0380859375, 18.484375, 19.9306640625, 21.376953125, 22.8232421875, 24.26953125, 25.7158203125, 27.162109375, 28.6083984375, 30.0546875, 31.5009765625, 32.947265625, 34.3935546875, 35.83984375, 37.2861328125, 38.732421875, 40.1787109375, 41.625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 5.0, 13.0, 14.0, 14.0, 28.0, 40.0, 46.0, 60.0, 93.0, 113.0, 184.0, 291.0, 425.0, 661.0, 602.0, 480.0, 323.0, 197.0, 143.0, 90.0, 64.0, 49.0, 30.0, 24.0, 34.0, 15.0, 11.0, 3.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.71484375, -3.61199951171875, -3.5091552734375, -3.40631103515625, -3.303466796875, -3.20062255859375, -3.0977783203125, -2.99493408203125, -2.89208984375, -2.78924560546875, -2.6864013671875, -2.58355712890625, -2.480712890625, -2.37786865234375, -2.2750244140625, -2.17218017578125, -2.0693359375, -1.96649169921875, -1.8636474609375, -1.76080322265625, -1.657958984375, -1.55511474609375, -1.4522705078125, -1.34942626953125, -1.24658203125, -1.14373779296875, -1.0408935546875, -0.93804931640625, -0.835205078125, -0.73236083984375, -0.6295166015625, -0.52667236328125, -0.423828125, -0.32098388671875, -0.2181396484375, -0.11529541015625, -0.012451171875, 0.09039306640625, 0.1932373046875, 0.29608154296875, 0.39892578125, 0.50177001953125, 0.6046142578125, 0.70745849609375, 0.810302734375, 0.91314697265625, 1.0159912109375, 1.11883544921875, 1.2216796875, 1.32452392578125, 1.4273681640625, 1.53021240234375, 1.633056640625, 1.73590087890625, 1.8387451171875, 1.94158935546875, 2.04443359375, 2.14727783203125, 2.2501220703125, 2.35296630859375, 2.455810546875, 2.55865478515625, 2.6614990234375, 2.76434326171875, 2.8671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 23.0, 22.0, 39.0, 61.0, 88.0, 90.0, 110.0, 126.0, 107.0, 84.0, 65.0, 40.0, 42.0, 29.0, 18.0, 13.0, 6.0, 10.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.584258079528809, -10.113957405090332, -9.643655776977539, -9.173355102539062, -8.70305347442627, -8.232752799987793, -7.762451648712158, -7.292150497436523, -6.821849346160889, -6.351548194885254, -5.881247043609619, -5.410945892333984, -4.940645217895508, -4.470343589782715, -4.000042915344238, -3.5297417640686035, -3.0594406127929688, -2.589139461517334, -2.118838310241699, -1.6485373973846436, -1.1782362461090088, -0.707935094833374, -0.23763418197631836, 0.2326669692993164, 0.7029681205749512, 1.173269271850586, 1.6435703039169312, 2.1138713359832764, 2.584172487258911, 3.054473638534546, 3.5247745513916016, 3.9950757026672363, 4.4653778076171875, 4.935678958892822, 5.405980110168457, 5.876280784606934, 6.346582412719727, 6.816883087158203, 7.287184238433838, 7.757485389709473, 8.227787017822266, 8.698087692260742, 9.168389320373535, 9.638689994812012, 10.108991622924805, 10.579292297363281, 11.049592971801758, 11.51989459991455, 11.990195274353027, 12.460495948791504, 12.930797576904297, 13.401098251342773, 13.871399879455566, 14.341700553894043, 14.812002182006836, 15.282302856445312, 15.752603530883789, 16.222904205322266, 16.693204879760742, 17.16350746154785, 17.633808135986328, 18.104108810424805, 18.57440948486328, 19.04471206665039, 19.515012741088867]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 1.0, 5.0, 8.0, 4.0, 7.0, 15.0, 15.0, 13.0, 21.0, 17.0, 25.0, 41.0, 42.0, 26.0, 37.0, 43.0, 45.0, 48.0, 47.0, 46.0, 59.0, 42.0, 51.0, 45.0, 41.0, 34.0, 33.0, 36.0, 29.0, 30.0, 12.0, 10.0, 23.0, 7.0, 5.0, 4.0, 10.0, 4.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.390345573425293, -7.156287670135498, -6.922229766845703, -6.688171863555908, -6.454113960266113, -6.220056056976318, -5.985998153686523, -5.751940727233887, -5.517882347106934, -5.283824443817139, -5.049766540527344, -4.815708637237549, -4.581650733947754, -4.347592830657959, -4.113534927368164, -3.8794772624969482, -3.6454195976257324, -3.4113616943359375, -3.1773037910461426, -2.9432458877563477, -2.7091879844665527, -2.475130081176758, -2.241072416305542, -2.007014513015747, -1.7729566097259521, -1.5388987064361572, -1.3048408031463623, -1.070783019065857, -0.836725115776062, -0.6026672124862671, -0.3686094284057617, -0.1345515251159668, 0.09950590133666992, 0.33356377482414246, 0.567621648311615, 0.8016794919967651, 1.03573739528656, 1.269795298576355, 1.5038530826568604, 1.7379109859466553, 1.9719688892364502, 2.206026792526245, 2.44008469581604, 2.674142360687256, 2.908200263977051, 3.1422581672668457, 3.3763160705566406, 3.6103739738464355, 3.8444318771362305, 4.078489780426025, 4.31254768371582, 4.546605587005615, 4.78066349029541, 5.014721393585205, 5.248779296875, 5.482836723327637, 5.71689510345459, 5.950953006744385, 6.18501091003418, 6.419068813323975, 6.6531267166137695, 6.8871846199035645, 7.121242523193359, 7.355299949645996, 7.589357852935791]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 7.0, 9.0, 17.0, 13.0, 23.0, 26.0, 40.0, 89.0, 185.0, 352.0, 988.0, 3157.0, 12995.0, 67491.0, 460773.0, 423665.0, 62159.0, 11942.0, 2931.0, 941.0, 352.0, 152.0, 85.0, 56.0, 43.0, 29.0, 6.0, 7.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.19232177734375, -4.0174560546875, -3.84259033203125, -3.667724609375, -3.49285888671875, -3.3179931640625, -3.14312744140625, -2.96826171875, -2.79339599609375, -2.6185302734375, -2.44366455078125, -2.268798828125, -2.09393310546875, -1.9190673828125, -1.74420166015625, -1.5693359375, -1.39447021484375, -1.2196044921875, -1.04473876953125, -0.869873046875, -0.69500732421875, -0.5201416015625, -0.34527587890625, -0.17041015625, 0.00445556640625, 0.1793212890625, 0.35418701171875, 0.529052734375, 0.70391845703125, 0.8787841796875, 1.05364990234375, 1.228515625, 1.40338134765625, 1.5782470703125, 1.75311279296875, 1.927978515625, 2.10284423828125, 2.2777099609375, 2.45257568359375, 2.62744140625, 2.80230712890625, 2.9771728515625, 3.15203857421875, 3.326904296875, 3.50177001953125, 3.6766357421875, 3.85150146484375, 4.0263671875, 4.20123291015625, 4.3760986328125, 4.55096435546875, 4.725830078125, 4.90069580078125, 5.0755615234375, 5.25042724609375, 5.42529296875, 5.60015869140625, 5.7750244140625, 5.94989013671875, 6.124755859375, 6.29962158203125, 6.4744873046875, 6.64935302734375, 6.82421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 7.0, 12.0, 17.0, 29.0, 33.0, 36.0, 50.0, 59.0, 69.0, 67.0, 61.0, 74.0, 69.0, 77.0, 74.0, 42.0, 52.0, 37.0, 35.0, 21.0, 22.0, 10.0, 8.0, 9.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.37982177734375, -4.1776123046875, -3.97540283203125, -3.773193359375, -3.57098388671875, -3.3687744140625, -3.16656494140625, -2.96435546875, -2.76214599609375, -2.5599365234375, -2.35772705078125, -2.155517578125, -1.95330810546875, -1.7510986328125, -1.54888916015625, -1.3466796875, -1.14447021484375, -0.9422607421875, -0.74005126953125, -0.537841796875, -0.33563232421875, -0.1334228515625, 0.06878662109375, 0.27099609375, 0.47320556640625, 0.6754150390625, 0.87762451171875, 1.079833984375, 1.28204345703125, 1.4842529296875, 1.68646240234375, 1.888671875, 2.09088134765625, 2.2930908203125, 2.49530029296875, 2.697509765625, 2.89971923828125, 3.1019287109375, 3.30413818359375, 3.50634765625, 3.70855712890625, 3.9107666015625, 4.11297607421875, 4.315185546875, 4.51739501953125, 4.7196044921875, 4.92181396484375, 5.1240234375, 5.32623291015625, 5.5284423828125, 5.73065185546875, 5.932861328125, 6.13507080078125, 6.3372802734375, 6.53948974609375, 6.74169921875, 6.94390869140625, 7.1461181640625, 7.34832763671875, 7.550537109375, 7.75274658203125, 7.9549560546875, 8.15716552734375, 8.359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 7.0, 4.0, 9.0, 12.0, 17.0, 19.0, 27.0, 33.0, 39.0, 57.0, 85.0, 128.0, 255.0, 355.0, 605.0, 1156.0, 2320.0, 5225.0, 11909.0, 30165.0, 80080.0, 224041.0, 395073.0, 185511.0, 66349.0, 25654.0, 10298.0, 4445.0, 2129.0, 1044.0, 555.0, 306.0, 211.0, 127.0, 94.0, 62.0, 40.0, 23.0, 18.0, 12.0, 9.0, 7.0, 11.0, 6.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.58984375, -2.50738525390625, -2.4249267578125, -2.34246826171875, -2.260009765625, -2.17755126953125, -2.0950927734375, -2.01263427734375, -1.93017578125, -1.84771728515625, -1.7652587890625, -1.68280029296875, -1.600341796875, -1.51788330078125, -1.4354248046875, -1.35296630859375, -1.2705078125, -1.18804931640625, -1.1055908203125, -1.02313232421875, -0.940673828125, -0.85821533203125, -0.7757568359375, -0.69329833984375, -0.61083984375, -0.52838134765625, -0.4459228515625, -0.36346435546875, -0.281005859375, -0.19854736328125, -0.1160888671875, -0.03363037109375, 0.048828125, 0.13128662109375, 0.2137451171875, 0.29620361328125, 0.378662109375, 0.46112060546875, 0.5435791015625, 0.62603759765625, 0.70849609375, 0.79095458984375, 0.8734130859375, 0.95587158203125, 1.038330078125, 1.12078857421875, 1.2032470703125, 1.28570556640625, 1.3681640625, 1.45062255859375, 1.5330810546875, 1.61553955078125, 1.697998046875, 1.78045654296875, 1.8629150390625, 1.94537353515625, 2.02783203125, 2.11029052734375, 2.1927490234375, 2.27520751953125, 2.357666015625, 2.44012451171875, 2.5225830078125, 2.60504150390625, 2.6875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 8.0, 7.0, 12.0, 17.0, 15.0, 19.0, 32.0, 31.0, 36.0, 32.0, 34.0, 37.0, 54.0, 52.0, 37.0, 41.0, 42.0, 42.0, 51.0, 42.0, 36.0, 31.0, 46.0, 25.0, 38.0, 25.0, 30.0, 29.0, 19.0, 10.0, 13.0, 16.0, 5.0, 5.0, 10.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.09991455078125, -8.8326416015625, -8.56536865234375, -8.298095703125, -8.03082275390625, -7.7635498046875, -7.49627685546875, -7.22900390625, -6.96173095703125, -6.6944580078125, -6.42718505859375, -6.159912109375, -5.89263916015625, -5.6253662109375, -5.35809326171875, -5.0908203125, -4.82354736328125, -4.5562744140625, -4.28900146484375, -4.021728515625, -3.75445556640625, -3.4871826171875, -3.21990966796875, -2.95263671875, -2.68536376953125, -2.4180908203125, -2.15081787109375, -1.883544921875, -1.61627197265625, -1.3489990234375, -1.08172607421875, -0.814453125, -0.54718017578125, -0.2799072265625, -0.01263427734375, 0.254638671875, 0.52191162109375, 0.7891845703125, 1.05645751953125, 1.32373046875, 1.59100341796875, 1.8582763671875, 2.12554931640625, 2.392822265625, 2.66009521484375, 2.9273681640625, 3.19464111328125, 3.4619140625, 3.72918701171875, 3.9964599609375, 4.26373291015625, 4.531005859375, 4.79827880859375, 5.0655517578125, 5.33282470703125, 5.60009765625, 5.86737060546875, 6.1346435546875, 6.40191650390625, 6.669189453125, 6.93646240234375, 7.2037353515625, 7.47100830078125, 7.73828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 10.0, 11.0, 20.0, 29.0, 45.0, 68.0, 93.0, 160.0, 265.0, 417.0, 702.0, 1250.0, 2263.0, 4556.0, 9536.0, 22130.0, 56731.0, 167781.0, 383536.0, 256296.0, 85720.0, 31425.0, 12818.0, 6028.0, 2907.0, 1562.0, 830.0, 496.0, 273.0, 200.0, 127.0, 90.0, 51.0, 36.0, 21.0, 20.0, 11.0, 9.0, 9.0, 3.0, 2.0, 0.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9052734375, -0.8775863647460938, -0.8498992919921875, -0.8222122192382812, -0.794525146484375, -0.7668380737304688, -0.7391510009765625, -0.7114639282226562, -0.68377685546875, -0.6560897827148438, -0.6284027099609375, -0.6007156372070312, -0.573028564453125, -0.5453414916992188, -0.5176544189453125, -0.48996734619140625, -0.4622802734375, -0.43459320068359375, -0.4069061279296875, -0.37921905517578125, -0.351531982421875, -0.32384490966796875, -0.2961578369140625, -0.26847076416015625, -0.24078369140625, -0.21309661865234375, -0.1854095458984375, -0.15772247314453125, -0.130035400390625, -0.10234832763671875, -0.0746612548828125, -0.04697418212890625, -0.019287109375, 0.00839996337890625, 0.0360870361328125, 0.06377410888671875, 0.091461181640625, 0.11914825439453125, 0.1468353271484375, 0.17452239990234375, 0.20220947265625, 0.22989654541015625, 0.2575836181640625, 0.28527069091796875, 0.312957763671875, 0.34064483642578125, 0.3683319091796875, 0.39601898193359375, 0.4237060546875, 0.45139312744140625, 0.4790802001953125, 0.5067672729492188, 0.534454345703125, 0.5621414184570312, 0.5898284912109375, 0.6175155639648438, 0.64520263671875, 0.6728897094726562, 0.7005767822265625, 0.7282638549804688, 0.755950927734375, 0.7836380004882812, 0.8113250732421875, 0.8390121459960938, 0.86669921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 11.0, 19.0, 26.0, 32.0, 41.0, 56.0, 62.0, 70.0, 110.0, 102.0, 90.0, 85.0, 71.0, 49.0, 30.0, 31.0, 28.0, 14.0, 17.0, 7.0, 2.0, 6.0, 9.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006198883056640625, -0.0006008297204971313, -0.0005817711353302002, -0.000562712550163269, -0.0005436539649963379, -0.0005245953798294067, -0.0005055367946624756, -0.00048647820949554443, -0.0004674196243286133, -0.00044836103916168213, -0.000429302453994751, -0.0004102438688278198, -0.00039118528366088867, -0.0003721266984939575, -0.00035306811332702637, -0.0003340095281600952, -0.00031495094299316406, -0.0002958923578262329, -0.00027683377265930176, -0.0002577751874923706, -0.00023871660232543945, -0.0002196580171585083, -0.00020059943199157715, -0.000181540846824646, -0.00016248226165771484, -0.0001434236764907837, -0.00012436509132385254, -0.00010530650615692139, -8.624792098999023e-05, -6.718933582305908e-05, -4.813075065612793e-05, -2.9072165489196777e-05, -1.0013580322265625e-05, 9.045004844665527e-06, 2.810359001159668e-05, 4.716217517852783e-05, 6.622076034545898e-05, 8.527934551239014e-05, 0.00010433793067932129, 0.00012339651584625244, 0.0001424551010131836, 0.00016151368618011475, 0.0001805722713470459, 0.00019963085651397705, 0.0002186894416809082, 0.00023774802684783936, 0.0002568066120147705, 0.00027586519718170166, 0.0002949237823486328, 0.00031398236751556396, 0.0003330409526824951, 0.00035209953784942627, 0.0003711581230163574, 0.0003902167081832886, 0.0004092752933502197, 0.0004283338785171509, 0.00044739246368408203, 0.0004664510488510132, 0.00048550963401794434, 0.0005045682191848755, 0.0005236268043518066, 0.0005426853895187378, 0.0005617439746856689, 0.0005808025598526001, 0.0005998611450195312]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 8.0, 12.0, 15.0, 15.0, 20.0, 18.0, 33.0, 62.0, 95.0, 182.0, 297.0, 564.0, 1449.0, 3790.0, 11856.0, 43934.0, 187987.0, 494666.0, 228760.0, 53286.0, 13983.0, 4433.0, 1553.0, 700.0, 309.0, 167.0, 96.0, 62.0, 32.0, 42.0, 34.0, 15.0, 19.0, 2.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.232421875, -1.194580078125, -1.15673828125, -1.118896484375, -1.0810546875, -1.043212890625, -1.00537109375, -0.967529296875, -0.9296875, -0.891845703125, -0.85400390625, -0.816162109375, -0.7783203125, -0.740478515625, -0.70263671875, -0.664794921875, -0.626953125, -0.589111328125, -0.55126953125, -0.513427734375, -0.4755859375, -0.437744140625, -0.39990234375, -0.362060546875, -0.32421875, -0.286376953125, -0.24853515625, -0.210693359375, -0.1728515625, -0.135009765625, -0.09716796875, -0.059326171875, -0.021484375, 0.016357421875, 0.05419921875, 0.092041015625, 0.1298828125, 0.167724609375, 0.20556640625, 0.243408203125, 0.28125, 0.319091796875, 0.35693359375, 0.394775390625, 0.4326171875, 0.470458984375, 0.50830078125, 0.546142578125, 0.583984375, 0.621826171875, 0.65966796875, 0.697509765625, 0.7353515625, 0.773193359375, 0.81103515625, 0.848876953125, 0.88671875, 0.924560546875, 0.96240234375, 1.000244140625, 1.0380859375, 1.075927734375, 1.11376953125, 1.151611328125, 1.189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 4.0, 5.0, 11.0, 5.0, 12.0, 11.0, 19.0, 32.0, 29.0, 25.0, 40.0, 39.0, 43.0, 51.0, 62.0, 61.0, 74.0, 84.0, 71.0, 51.0, 49.0, 40.0, 36.0, 22.0, 26.0, 23.0, 14.0, 7.0, 8.0, 7.0, 8.0, 8.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2454833984375, -0.2384490966796875, -0.231414794921875, -0.2243804931640625, -0.21734619140625, -0.2103118896484375, -0.203277587890625, -0.1962432861328125, -0.189208984375, -0.1821746826171875, -0.175140380859375, -0.1681060791015625, -0.16107177734375, -0.1540374755859375, -0.147003173828125, -0.1399688720703125, -0.1329345703125, -0.1259002685546875, -0.118865966796875, -0.1118316650390625, -0.10479736328125, -0.0977630615234375, -0.090728759765625, -0.0836944580078125, -0.07666015625, -0.0696258544921875, -0.062591552734375, -0.0555572509765625, -0.04852294921875, -0.0414886474609375, -0.034454345703125, -0.0274200439453125, -0.0203857421875, -0.0133514404296875, -0.006317138671875, 0.0007171630859375, 0.00775146484375, 0.0147857666015625, 0.021820068359375, 0.0288543701171875, 0.035888671875, 0.0429229736328125, 0.049957275390625, 0.0569915771484375, 0.06402587890625, 0.0710601806640625, 0.078094482421875, 0.0851287841796875, 0.0921630859375, 0.0991973876953125, 0.106231689453125, 0.1132659912109375, 0.12030029296875, 0.1273345947265625, 0.134368896484375, 0.1414031982421875, 0.1484375, 0.1554718017578125, 0.162506103515625, 0.1695404052734375, 0.17657470703125, 0.1836090087890625, 0.190643310546875, 0.1976776123046875, 0.2047119140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 10.0, 11.0, 14.0, 26.0, 38.0, 65.0, 103.0, 124.0, 130.0, 139.0, 107.0, 76.0, 52.0, 36.0, 23.0, 25.0, 6.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.971366882324219, -4.660595893859863, -4.349824905395508, -4.039053916931152, -3.728283166885376, -3.4175121784210205, -3.106741428375244, -2.7959704399108887, -2.485199451446533, -2.1744284629821777, -1.8636575937271118, -1.552886724472046, -1.2421157360076904, -0.931344747543335, -0.620573878288269, -0.3098030090332031, 0.0009679794311523438, 0.31173890829086304, 0.6225098371505737, 0.9332807660102844, 1.2440516948699951, 1.5548226833343506, 1.8655935525894165, 2.1763644218444824, 2.487135410308838, 2.7979063987731934, 3.108677387237549, 3.419448137283325, 3.7302191257476807, 4.040989875793457, 4.3517608642578125, 4.662531852722168, 4.973302841186523, 5.284073829650879, 5.594844818115234, 5.90561580657959, 6.216386795043945, 6.527157783508301, 6.837928295135498, 7.1486992835998535, 7.459470272064209, 7.7702412605285645, 8.081011772155762, 8.391782760620117, 8.702553749084473, 9.013324737548828, 9.324095726013184, 9.634866714477539, 9.945637702941895, 10.25640869140625, 10.567179679870605, 10.877950668334961, 11.188721656799316, 11.499492645263672, 11.810263633728027, 12.121034622192383, 12.431804656982422, 12.742575645446777, 13.053346633911133, 13.364117622375488, 13.674888610839844, 13.9856595993042, 14.296430587768555, 14.607200622558594, 14.917972564697266]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 8.0, 3.0, 7.0, 13.0, 18.0, 21.0, 25.0, 38.0, 55.0, 43.0, 46.0, 58.0, 66.0, 62.0, 74.0, 57.0, 71.0, 52.0, 51.0, 53.0, 40.0, 41.0, 19.0, 21.0, 14.0, 11.0, 6.0, 10.0, 1.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71080207824707, -4.533476829528809, -4.356152057647705, -4.178826808929443, -4.00150203704834, -3.8241770267486572, -3.6468520164489746, -3.469526767730713, -3.2922019958496094, -3.1148769855499268, -2.937551975250244, -2.7602269649505615, -2.582901954650879, -2.4055769443511963, -2.2282519340515137, -2.050926685333252, -1.8736016750335693, -1.6962766647338867, -1.518951654434204, -1.3416266441345215, -1.1643016338348389, -0.9869765639305115, -0.8096514940261841, -0.6323264837265015, -0.45500147342681885, -0.27767646312713623, -0.10035142302513123, 0.07697361707687378, 0.2542986273765564, 0.431623637676239, 0.6089487075805664, 0.786273717880249, 0.9635987281799316, 1.1409237384796143, 1.3182487487792969, 1.4955737590789795, 1.672898769378662, 1.8502237796783447, 2.0275487899780273, 2.204874038696289, 2.3821988105773926, 2.559523820877075, 2.736848831176758, 2.9141738414764404, 3.091498851776123, 3.2688238620758057, 3.4461488723754883, 3.62347412109375, 3.8007991313934326, 3.9781241416931152, 4.155449390411377, 4.3327741622924805, 4.510099411010742, 4.687424182891846, 4.864749431610107, 5.042074203491211, 5.219399452209473, 5.396724700927734, 5.574049472808838, 5.7513747215271, 5.928699493408203, 6.106024742126465, 6.283349514007568, 6.46067476272583, 6.637999534606934]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 4.0, 10.0, 16.0, 19.0, 26.0, 41.0, 70.0, 128.0, 231.0, 385.0, 639.0, 1260.0, 2465.0, 4933.0, 10348.0, 22996.0, 61482.0, 232337.0, 499731.0, 136399.0, 42056.0, 17089.0, 7727.0, 3781.0, 2000.0, 1079.0, 514.0, 309.0, 178.0, 110.0, 70.0, 30.0, 30.0, 25.0, 12.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.03515625, -5.85931396484375, -5.6834716796875, -5.50762939453125, -5.331787109375, -5.15594482421875, -4.9801025390625, -4.80426025390625, -4.62841796875, -4.45257568359375, -4.2767333984375, -4.10089111328125, -3.925048828125, -3.74920654296875, -3.5733642578125, -3.39752197265625, -3.2216796875, -3.04583740234375, -2.8699951171875, -2.69415283203125, -2.518310546875, -2.34246826171875, -2.1666259765625, -1.99078369140625, -1.81494140625, -1.63909912109375, -1.4632568359375, -1.28741455078125, -1.111572265625, -0.93572998046875, -0.7598876953125, -0.58404541015625, -0.408203125, -0.23236083984375, -0.0565185546875, 0.11932373046875, 0.295166015625, 0.47100830078125, 0.6468505859375, 0.82269287109375, 0.99853515625, 1.17437744140625, 1.3502197265625, 1.52606201171875, 1.701904296875, 1.87774658203125, 2.0535888671875, 2.22943115234375, 2.4052734375, 2.58111572265625, 2.7569580078125, 2.93280029296875, 3.108642578125, 3.28448486328125, 3.4603271484375, 3.63616943359375, 3.81201171875, 3.98785400390625, 4.1636962890625, 4.33953857421875, 4.515380859375, 4.69122314453125, 4.8670654296875, 5.04290771484375, 5.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 15.0, 14.0, 22.0, 18.0, 36.0, 34.0, 57.0, 46.0, 49.0, 63.0, 59.0, 52.0, 68.0, 67.0, 69.0, 67.0, 36.0, 36.0, 37.0, 32.0, 25.0, 16.0, 16.0, 11.0, 8.0, 10.0, 5.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.2325439453125, -8.847900390625, -8.4632568359375, -8.07861328125, -7.6939697265625, -7.309326171875, -6.9246826171875, -6.5400390625, -6.1553955078125, -5.770751953125, -5.3861083984375, -5.00146484375, -4.6168212890625, -4.232177734375, -3.8475341796875, -3.462890625, -3.0782470703125, -2.693603515625, -2.3089599609375, -1.92431640625, -1.5396728515625, -1.155029296875, -0.7703857421875, -0.3857421875, -0.0010986328125, 0.383544921875, 0.7681884765625, 1.15283203125, 1.5374755859375, 1.922119140625, 2.3067626953125, 2.69140625, 3.0760498046875, 3.460693359375, 3.8453369140625, 4.22998046875, 4.6146240234375, 4.999267578125, 5.3839111328125, 5.7685546875, 6.1531982421875, 6.537841796875, 6.9224853515625, 7.30712890625, 7.6917724609375, 8.076416015625, 8.4610595703125, 8.845703125, 9.2303466796875, 9.614990234375, 9.9996337890625, 10.38427734375, 10.7689208984375, 11.153564453125, 11.5382080078125, 11.9228515625, 12.3074951171875, 12.692138671875, 13.0767822265625, 13.46142578125, 13.8460693359375, 14.230712890625, 14.6153564453125, 15.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 10.0, 7.0, 13.0, 7.0, 16.0, 15.0, 19.0, 21.0, 22.0, 29.0, 24.0, 25.0, 31.0, 51.0, 68.0, 155.0, 864.0, 22182.0, 975521.0, 47466.0, 1360.0, 176.0, 98.0, 49.0, 44.0, 47.0, 35.0, 22.0, 31.0, 24.0, 16.0, 22.0, 18.0, 8.0, 11.0, 8.0, 8.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.859375, -26.059814453125, -25.26025390625, -24.460693359375, -23.6611328125, -22.861572265625, -22.06201171875, -21.262451171875, -20.462890625, -19.663330078125, -18.86376953125, -18.064208984375, -17.2646484375, -16.465087890625, -15.66552734375, -14.865966796875, -14.06640625, -13.266845703125, -12.46728515625, -11.667724609375, -10.8681640625, -10.068603515625, -9.26904296875, -8.469482421875, -7.669921875, -6.870361328125, -6.07080078125, -5.271240234375, -4.4716796875, -3.672119140625, -2.87255859375, -2.072998046875, -1.2734375, -0.473876953125, 0.32568359375, 1.125244140625, 1.9248046875, 2.724365234375, 3.52392578125, 4.323486328125, 5.123046875, 5.922607421875, 6.72216796875, 7.521728515625, 8.3212890625, 9.120849609375, 9.92041015625, 10.719970703125, 11.51953125, 12.319091796875, 13.11865234375, 13.918212890625, 14.7177734375, 15.517333984375, 16.31689453125, 17.116455078125, 17.916015625, 18.715576171875, 19.51513671875, 20.314697265625, 21.1142578125, 21.913818359375, 22.71337890625, 23.512939453125, 24.3125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 6.0, 7.0, 12.0, 10.0, 12.0, 11.0, 17.0, 16.0, 21.0, 26.0, 14.0, 27.0, 30.0, 28.0, 29.0, 39.0, 34.0, 49.0, 39.0, 37.0, 44.0, 33.0, 41.0, 47.0, 44.0, 36.0, 35.0, 26.0, 26.0, 22.0, 32.0, 20.0, 27.0, 12.0, 9.0, 10.0, 12.0, 11.0, 14.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.1328125, -7.8865966796875, -7.640380859375, -7.3941650390625, -7.14794921875, -6.9017333984375, -6.655517578125, -6.4093017578125, -6.1630859375, -5.9168701171875, -5.670654296875, -5.4244384765625, -5.17822265625, -4.9320068359375, -4.685791015625, -4.4395751953125, -4.193359375, -3.9471435546875, -3.700927734375, -3.4547119140625, -3.20849609375, -2.9622802734375, -2.716064453125, -2.4698486328125, -2.2236328125, -1.9774169921875, -1.731201171875, -1.4849853515625, -1.23876953125, -0.9925537109375, -0.746337890625, -0.5001220703125, -0.25390625, -0.0076904296875, 0.238525390625, 0.4847412109375, 0.73095703125, 0.9771728515625, 1.223388671875, 1.4696044921875, 1.7158203125, 1.9620361328125, 2.208251953125, 2.4544677734375, 2.70068359375, 2.9468994140625, 3.193115234375, 3.4393310546875, 3.685546875, 3.9317626953125, 4.177978515625, 4.4241943359375, 4.67041015625, 4.9166259765625, 5.162841796875, 5.4090576171875, 5.6552734375, 5.9014892578125, 6.147705078125, 6.3939208984375, 6.64013671875, 6.8863525390625, 7.132568359375, 7.3787841796875, 7.625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 13.0, 24.0, 28.0, 29.0, 61.0, 117.0, 215.0, 418.0, 1076.0, 3160.0, 13506.0, 106128.0, 788108.0, 116060.0, 14167.0, 3367.0, 1128.0, 452.0, 192.0, 108.0, 57.0, 38.0, 25.0, 17.0, 11.0, 3.0, 9.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.143768310546875, -2.06292724609375, -1.982086181640625, -1.9012451171875, -1.820404052734375, -1.73956298828125, -1.658721923828125, -1.577880859375, -1.497039794921875, -1.41619873046875, -1.335357666015625, -1.2545166015625, -1.173675537109375, -1.09283447265625, -1.011993408203125, -0.93115234375, -0.850311279296875, -0.76947021484375, -0.688629150390625, -0.6077880859375, -0.526947021484375, -0.44610595703125, -0.365264892578125, -0.284423828125, -0.203582763671875, -0.12274169921875, -0.041900634765625, 0.0389404296875, 0.119781494140625, 0.20062255859375, 0.281463623046875, 0.3623046875, 0.443145751953125, 0.52398681640625, 0.604827880859375, 0.6856689453125, 0.766510009765625, 0.84735107421875, 0.928192138671875, 1.009033203125, 1.089874267578125, 1.17071533203125, 1.251556396484375, 1.3323974609375, 1.413238525390625, 1.49407958984375, 1.574920654296875, 1.65576171875, 1.736602783203125, 1.81744384765625, 1.898284912109375, 1.9791259765625, 2.059967041015625, 2.14080810546875, 2.221649169921875, 2.302490234375, 2.383331298828125, 2.46417236328125, 2.545013427734375, 2.6258544921875, 2.706695556640625, 2.78753662109375, 2.868377685546875, 2.94921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 8.0, 6.0, 15.0, 22.0, 28.0, 62.0, 100.0, 124.0, 187.0, 162.0, 107.0, 60.0, 57.0, 27.0, 18.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004611015319824219, -0.0004478655755519867, -0.0004346296191215515, -0.00042139366269111633, -0.00040815770626068115, -0.00039492174983024597, -0.0003816857933998108, -0.0003684498369693756, -0.00035521388053894043, -0.00034197792410850525, -0.00032874196767807007, -0.0003155060112476349, -0.0003022700548171997, -0.0002890340983867645, -0.00027579814195632935, -0.00026256218552589417, -0.000249326229095459, -0.0002360902726650238, -0.00022285431623458862, -0.00020961835980415344, -0.00019638240337371826, -0.00018314644694328308, -0.0001699104905128479, -0.00015667453408241272, -0.00014343857765197754, -0.00013020262122154236, -0.00011696666479110718, -0.000103730708360672, -9.049475193023682e-05, -7.725879549980164e-05, -6.402283906936646e-05, -5.0786882638931274e-05, -3.7550926208496094e-05, -2.4314969778060913e-05, -1.1079013347625732e-05, 2.1569430828094482e-06, 1.539289951324463e-05, 2.862885594367981e-05, 4.186481237411499e-05, 5.510076880455017e-05, 6.833672523498535e-05, 8.157268166542053e-05, 9.480863809585571e-05, 0.0001080445945262909, 0.00012128055095672607, 0.00013451650738716125, 0.00014775246381759644, 0.00016098842024803162, 0.0001742243766784668, 0.00018746033310890198, 0.00020069628953933716, 0.00021393224596977234, 0.00022716820240020752, 0.0002404041588306427, 0.0002536401152610779, 0.00026687607169151306, 0.00028011202812194824, 0.0002933479845523834, 0.0003065839409828186, 0.0003198198974132538, 0.00033305585384368896, 0.00034629181027412415, 0.0003595277667045593, 0.0003727637231349945, 0.0003859996795654297]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 13.0, 19.0, 27.0, 40.0, 52.0, 95.0, 141.0, 190.0, 323.0, 604.0, 1094.0, 2138.0, 4440.0, 10182.0, 26103.0, 85699.0, 359817.0, 408312.0, 98805.0, 29405.0, 11074.0, 4884.0, 2296.0, 1147.0, 672.0, 360.0, 213.0, 135.0, 74.0, 47.0, 51.0, 26.0, 15.0, 9.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1485137939453125, -1.107574462890625, -1.0666351318359375, -1.02569580078125, -0.9847564697265625, -0.943817138671875, -0.9028778076171875, -0.8619384765625, -0.8209991455078125, -0.780059814453125, -0.7391204833984375, -0.69818115234375, -0.6572418212890625, -0.616302490234375, -0.5753631591796875, -0.534423828125, -0.4934844970703125, -0.452545166015625, -0.4116058349609375, -0.37066650390625, -0.3297271728515625, -0.288787841796875, -0.2478485107421875, -0.2069091796875, -0.1659698486328125, -0.125030517578125, -0.0840911865234375, -0.04315185546875, -0.0022125244140625, 0.038726806640625, 0.0796661376953125, 0.12060546875, 0.1615447998046875, 0.202484130859375, 0.2434234619140625, 0.28436279296875, 0.3253021240234375, 0.366241455078125, 0.4071807861328125, 0.4481201171875, 0.4890594482421875, 0.529998779296875, 0.5709381103515625, 0.61187744140625, 0.6528167724609375, 0.693756103515625, 0.7346954345703125, 0.775634765625, 0.8165740966796875, 0.857513427734375, 0.8984527587890625, 0.93939208984375, 0.9803314208984375, 1.021270751953125, 1.0622100830078125, 1.1031494140625, 1.1440887451171875, 1.185028076171875, 1.2259674072265625, 1.26690673828125, 1.3078460693359375, 1.348785400390625, 1.3897247314453125, 1.4306640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 15.0, 14.0, 12.0, 25.0, 30.0, 34.0, 48.0, 58.0, 72.0, 84.0, 81.0, 92.0, 84.0, 67.0, 49.0, 36.0, 37.0, 23.0, 13.0, 23.0, 12.0, 12.0, 9.0, 8.0, 4.0, 6.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7584304809570312, -0.7365875244140625, -0.7147445678710938, -0.692901611328125, -0.6710586547851562, -0.6492156982421875, -0.6273727416992188, -0.60552978515625, -0.5836868286132812, -0.5618438720703125, -0.5400009155273438, -0.518157958984375, -0.49631500244140625, -0.4744720458984375, -0.45262908935546875, -0.4307861328125, -0.40894317626953125, -0.3871002197265625, -0.36525726318359375, -0.343414306640625, -0.32157135009765625, -0.2997283935546875, -0.27788543701171875, -0.25604248046875, -0.23419952392578125, -0.2123565673828125, -0.19051361083984375, -0.168670654296875, -0.14682769775390625, -0.1249847412109375, -0.10314178466796875, -0.081298828125, -0.05945587158203125, -0.0376129150390625, -0.01576995849609375, 0.006072998046875, 0.02791595458984375, 0.0497589111328125, 0.07160186767578125, 0.09344482421875, 0.11528778076171875, 0.1371307373046875, 0.15897369384765625, 0.180816650390625, 0.20265960693359375, 0.2245025634765625, 0.24634552001953125, 0.2681884765625, 0.29003143310546875, 0.3118743896484375, 0.33371734619140625, 0.355560302734375, 0.37740325927734375, 0.3992462158203125, 0.42108917236328125, 0.44293212890625, 0.46477508544921875, 0.4866180419921875, 0.5084609985351562, 0.530303955078125, 0.5521469116210938, 0.5739898681640625, 0.5958328247070312, 0.61767578125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 21.0, 56.0, 127.0, 323.0, 284.0, 127.0, 45.0, 16.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.40650177001953, -75.82705688476562, -74.24761199951172, -72.66816711425781, -71.0887222290039, -69.50927734375, -67.9298324584961, -66.35038757324219, -64.77095031738281, -63.191505432128906, -61.612060546875, -60.032615661621094, -58.45317077636719, -56.87372970581055, -55.29428482055664, -53.714839935302734, -52.13539123535156, -50.555946350097656, -48.97650146484375, -47.397056579589844, -45.81761169433594, -44.2381706237793, -42.65872573852539, -41.079280853271484, -39.49983596801758, -37.92039108276367, -36.340946197509766, -34.76150131225586, -33.18206024169922, -31.60261344909668, -30.023170471191406, -28.4437255859375, -26.864280700683594, -25.284835815429688, -23.70539093017578, -22.125947952270508, -20.5465030670166, -18.967058181762695, -17.387615203857422, -15.808170318603516, -14.22872543334961, -12.649280548095703, -11.069836616516113, -9.490392684936523, -7.910947799682617, -6.331503391265869, -4.752058982849121, -3.1726150512695312, -1.593170166015625, -0.013725757598876953, 1.565718650817871, 3.145163059234619, 4.724607467651367, 6.304051876068115, 7.883496284484863, 9.462940216064453, 11.04238510131836, 12.621829986572266, 14.201273918151855, 15.780717849731445, 17.36016273498535, 18.939607620239258, 20.51905059814453, 22.098495483398438, 23.677940368652344]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 8.0, 8.0, 11.0, 14.0, 24.0, 25.0, 21.0, 30.0, 36.0, 33.0, 32.0, 40.0, 40.0, 63.0, 36.0, 46.0, 43.0, 53.0, 48.0, 37.0, 40.0, 38.0, 34.0, 33.0, 27.0, 21.0, 22.0, 15.0, 20.0, 16.0, 16.0, 9.0, 9.0, 11.0, 4.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.492140769958496, -12.017292976379395, -11.542445182800293, -11.067597389221191, -10.592748641967773, -10.117900848388672, -9.64305305480957, -9.168205261230469, -8.693357467651367, -8.218509674072266, -7.743661880493164, -7.268813610076904, -6.793965816497803, -6.319118022918701, -5.844269752502441, -5.36942195892334, -4.894574165344238, -4.419726371765137, -3.944878339767456, -3.4700303077697754, -2.995182514190674, -2.5203347206115723, -2.0454866886138916, -1.570638656616211, -1.0957908630371094, -0.6209429502487183, -0.14609503746032715, 0.32875287532806396, 0.8036007881164551, 1.2784485816955566, 1.7532966136932373, 2.228144645690918, 2.702991485595703, 3.1778392791748047, 3.6526873111724854, 4.127535343170166, 4.602383136749268, 5.077230930328369, 5.552079200744629, 6.0269269943237305, 6.501774787902832, 6.976622581481934, 7.451470375061035, 7.926318645477295, 8.401166915893555, 8.876014709472656, 9.350862503051758, 9.82571029663086, 10.300558090209961, 10.775405883789062, 11.250253677368164, 11.725101470947266, 12.199949264526367, 12.674797058105469, 13.149645805358887, 13.624493598937988, 14.09934139251709, 14.574189186096191, 15.049036979675293, 15.523884773254395, 15.998733520507812, 16.473581314086914, 16.948429107666016, 17.423276901245117, 17.89812469482422]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 16.0, 20.0, 36.0, 42.0, 72.0, 123.0, 203.0, 289.0, 505.0, 918.0, 1544.0, 3225.0, 7418.0, 20535.0, 79699.0, 509986.0, 2501218.0, 903084.0, 120599.0, 27382.0, 9045.0, 3914.0, 1892.0, 972.0, 549.0, 315.0, 218.0, 128.0, 106.0, 65.0, 37.0, 23.0, 22.0, 22.0, 9.0, 3.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.89453125, -7.62811279296875, -7.3616943359375, -7.09527587890625, -6.828857421875, -6.56243896484375, -6.2960205078125, -6.02960205078125, -5.76318359375, -5.49676513671875, -5.2303466796875, -4.96392822265625, -4.697509765625, -4.43109130859375, -4.1646728515625, -3.89825439453125, -3.6318359375, -3.36541748046875, -3.0989990234375, -2.83258056640625, -2.566162109375, -2.29974365234375, -2.0333251953125, -1.76690673828125, -1.50048828125, -1.23406982421875, -0.9676513671875, -0.70123291015625, -0.434814453125, -0.16839599609375, 0.0980224609375, 0.36444091796875, 0.630859375, 0.89727783203125, 1.1636962890625, 1.43011474609375, 1.696533203125, 1.96295166015625, 2.2293701171875, 2.49578857421875, 2.76220703125, 3.02862548828125, 3.2950439453125, 3.56146240234375, 3.827880859375, 4.09429931640625, 4.3607177734375, 4.62713623046875, 4.8935546875, 5.15997314453125, 5.4263916015625, 5.69281005859375, 5.959228515625, 6.22564697265625, 6.4920654296875, 6.75848388671875, 7.02490234375, 7.29132080078125, 7.5577392578125, 7.82415771484375, 8.090576171875, 8.35699462890625, 8.6234130859375, 8.88983154296875, 9.15625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 3.0, 6.0, 5.0, 6.0, 7.0, 12.0, 14.0, 22.0, 22.0, 26.0, 32.0, 42.0, 43.0, 49.0, 40.0, 59.0, 57.0, 58.0, 58.0, 54.0, 66.0, 55.0, 40.0, 34.0, 42.0, 26.0, 18.0, 23.0, 11.0, 13.0, 20.0, 9.0, 9.0, 4.0, 7.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.70294189453125, -6.4996337890625, -6.29632568359375, -6.093017578125, -5.88970947265625, -5.6864013671875, -5.48309326171875, -5.27978515625, -5.07647705078125, -4.8731689453125, -4.66986083984375, -4.466552734375, -4.26324462890625, -4.0599365234375, -3.85662841796875, -3.6533203125, -3.45001220703125, -3.2467041015625, -3.04339599609375, -2.840087890625, -2.63677978515625, -2.4334716796875, -2.23016357421875, -2.02685546875, -1.82354736328125, -1.6202392578125, -1.41693115234375, -1.213623046875, -1.01031494140625, -0.8070068359375, -0.60369873046875, -0.400390625, -0.19708251953125, 0.0062255859375, 0.20953369140625, 0.412841796875, 0.61614990234375, 0.8194580078125, 1.02276611328125, 1.22607421875, 1.42938232421875, 1.6326904296875, 1.83599853515625, 2.039306640625, 2.24261474609375, 2.4459228515625, 2.64923095703125, 2.8525390625, 3.05584716796875, 3.2591552734375, 3.46246337890625, 3.665771484375, 3.86907958984375, 4.0723876953125, 4.27569580078125, 4.47900390625, 4.68231201171875, 4.8856201171875, 5.08892822265625, 5.292236328125, 5.49554443359375, 5.6988525390625, 5.90216064453125, 6.10546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 13.0, 12.0, 32.0, 40.0, 61.0, 98.0, 158.0, 337.0, 1360.0, 12796.0, 2614336.0, 1552172.0, 10860.0, 1222.0, 303.0, 171.0, 95.0, 68.0, 44.0, 28.0, 21.0, 14.0, 8.0, 5.0, 3.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.3125, -16.5244140625, -15.736328125, -14.9482421875, -14.16015625, -13.3720703125, -12.583984375, -11.7958984375, -11.0078125, -10.2197265625, -9.431640625, -8.6435546875, -7.85546875, -7.0673828125, -6.279296875, -5.4912109375, -4.703125, -3.9150390625, -3.126953125, -2.3388671875, -1.55078125, -0.7626953125, 0.025390625, 0.8134765625, 1.6015625, 2.3896484375, 3.177734375, 3.9658203125, 4.75390625, 5.5419921875, 6.330078125, 7.1181640625, 7.90625, 8.6943359375, 9.482421875, 10.2705078125, 11.05859375, 11.8466796875, 12.634765625, 13.4228515625, 14.2109375, 14.9990234375, 15.787109375, 16.5751953125, 17.36328125, 18.1513671875, 18.939453125, 19.7275390625, 20.515625, 21.3037109375, 22.091796875, 22.8798828125, 23.66796875, 24.4560546875, 25.244140625, 26.0322265625, 26.8203125, 27.6083984375, 28.396484375, 29.1845703125, 29.97265625, 30.7607421875, 31.548828125, 32.3369140625, 33.125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 20.0, 21.0, 37.0, 64.0, 88.0, 135.0, 251.0, 449.0, 771.0, 935.0, 575.0, 279.0, 150.0, 98.0, 62.0, 41.0, 25.0, 16.0, 14.0, 11.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5, -4.38525390625, -4.2705078125, -4.15576171875, -4.041015625, -3.92626953125, -3.8115234375, -3.69677734375, -3.58203125, -3.46728515625, -3.3525390625, -3.23779296875, -3.123046875, -3.00830078125, -2.8935546875, -2.77880859375, -2.6640625, -2.54931640625, -2.4345703125, -2.31982421875, -2.205078125, -2.09033203125, -1.9755859375, -1.86083984375, -1.74609375, -1.63134765625, -1.5166015625, -1.40185546875, -1.287109375, -1.17236328125, -1.0576171875, -0.94287109375, -0.828125, -0.71337890625, -0.5986328125, -0.48388671875, -0.369140625, -0.25439453125, -0.1396484375, -0.02490234375, 0.08984375, 0.20458984375, 0.3193359375, 0.43408203125, 0.548828125, 0.66357421875, 0.7783203125, 0.89306640625, 1.0078125, 1.12255859375, 1.2373046875, 1.35205078125, 1.466796875, 1.58154296875, 1.6962890625, 1.81103515625, 1.92578125, 2.04052734375, 2.1552734375, 2.27001953125, 2.384765625, 2.49951171875, 2.6142578125, 2.72900390625, 2.84375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 6.0, 14.0, 21.0, 37.0, 42.0, 59.0, 86.0, 102.0, 143.0, 115.0, 101.0, 92.0, 57.0, 31.0, 26.0, 26.0, 15.0, 6.0, 5.0, 5.0, 1.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.095888137817383, -7.672084331512451, -7.2482805252075195, -6.824477195739746, -6.4006733894348145, -5.976869583129883, -5.553066253662109, -5.129262447357178, -4.705458641052246, -4.2816548347473145, -3.857851266860962, -3.4340476989746094, -3.0102438926696777, -2.586440086364746, -2.1626365184783936, -1.738832950592041, -1.3150291442871094, -0.8912254571914673, -0.4674217700958252, -0.043618083000183105, 0.380185604095459, 0.8039894104003906, 1.2277929782867432, 1.6515965461730957, 2.0754003524780273, 2.499204158782959, 2.9230077266693115, 3.346811294555664, 3.7706151008605957, 4.194418907165527, 4.618222236633301, 5.042026042938232, 5.465829849243164, 5.889633655548096, 6.313437461853027, 6.737240791320801, 7.161044597625732, 7.584848403930664, 8.008651733398438, 8.432455062866211, 8.8562593460083, 9.280062675476074, 9.703866958618164, 10.127670288085938, 10.551473617553711, 10.9752779006958, 11.399081230163574, 11.822885513305664, 12.246688842773438, 12.670492172241211, 13.0942964553833, 13.518099784851074, 13.941904067993164, 14.365707397460938, 14.789510726928711, 15.213314056396484, 15.637118339538574, 16.060922622680664, 16.484725952148438, 16.90852928161621, 17.332332611083984, 17.75613784790039, 18.179941177368164, 18.603744506835938, 19.02754783630371]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 17.0, 10.0, 22.0, 19.0, 34.0, 35.0, 41.0, 37.0, 31.0, 56.0, 70.0, 54.0, 62.0, 70.0, 65.0, 57.0, 52.0, 48.0, 34.0, 41.0, 28.0, 24.0, 20.0, 11.0, 17.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.007919311523438, -7.742435455322266, -7.476951599121094, -7.211467266082764, -6.945983409881592, -6.68049955368042, -6.41501522064209, -6.149531364440918, -5.884047508239746, -5.618563652038574, -5.353079795837402, -5.087595462799072, -4.8221116065979, -4.5566277503967285, -4.291143417358398, -4.025659561157227, -3.7601757049560547, -3.494691848754883, -3.229207754135132, -2.963723659515381, -2.698239803314209, -2.432755947113037, -2.167271852493286, -1.9017878770828247, -1.6363039016723633, -1.3708199262619019, -1.1053359508514404, -0.839851975440979, -0.5743680000305176, -0.30888402462005615, -0.04340004920959473, 0.2220839262008667, 0.4875679016113281, 0.7530518770217896, 1.018535852432251, 1.2840198278427124, 1.5495038032531738, 1.8149877786636353, 2.0804717540740967, 2.3459558486938477, 2.6114397048950195, 2.8769235610961914, 3.1424076557159424, 3.4078917503356934, 3.6733756065368652, 3.938859462738037, 4.204343795776367, 4.469827651977539, 4.735311508178711, 5.000795364379883, 5.266279220581055, 5.531763553619385, 5.797247409820557, 6.0627312660217285, 6.328215599060059, 6.5936994552612305, 6.859183311462402, 7.124667167663574, 7.390151023864746, 7.655635356903076, 7.921119213104248, 8.186603546142578, 8.45208740234375, 8.717571258544922, 8.983055114746094]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 15.0, 12.0, 22.0, 35.0, 39.0, 48.0, 98.0, 179.0, 291.0, 570.0, 1154.0, 2525.0, 5871.0, 14737.0, 39874.0, 119622.0, 390008.0, 324123.0, 95431.0, 32272.0, 12361.0, 4962.0, 2137.0, 982.0, 519.0, 257.0, 156.0, 69.0, 56.0, 35.0, 27.0, 20.0, 11.0, 9.0, 6.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.164337158203125, -2.09429931640625, -2.024261474609375, -1.9542236328125, -1.884185791015625, -1.81414794921875, -1.744110107421875, -1.674072265625, -1.604034423828125, -1.53399658203125, -1.463958740234375, -1.3939208984375, -1.323883056640625, -1.25384521484375, -1.183807373046875, -1.11376953125, -1.043731689453125, -0.97369384765625, -0.903656005859375, -0.8336181640625, -0.763580322265625, -0.69354248046875, -0.623504638671875, -0.553466796875, -0.483428955078125, -0.41339111328125, -0.343353271484375, -0.2733154296875, -0.203277587890625, -0.13323974609375, -0.063201904296875, 0.0068359375, 0.076873779296875, 0.14691162109375, 0.216949462890625, 0.2869873046875, 0.357025146484375, 0.42706298828125, 0.497100830078125, 0.567138671875, 0.637176513671875, 0.70721435546875, 0.777252197265625, 0.8472900390625, 0.917327880859375, 0.98736572265625, 1.057403564453125, 1.12744140625, 1.197479248046875, 1.26751708984375, 1.337554931640625, 1.4075927734375, 1.477630615234375, 1.54766845703125, 1.617706298828125, 1.687744140625, 1.757781982421875, 1.82781982421875, 1.897857666015625, 1.9678955078125, 2.037933349609375, 2.10797119140625, 2.178009033203125, 2.248046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 12.0, 21.0, 17.0, 34.0, 39.0, 45.0, 47.0, 59.0, 69.0, 66.0, 68.0, 80.0, 77.0, 68.0, 59.0, 41.0, 39.0, 38.0, 28.0, 17.0, 14.0, 12.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -4.988525390625, -4.79736328125, -4.606201171875, -4.4150390625, -4.223876953125, -4.03271484375, -3.841552734375, -3.650390625, -3.459228515625, -3.26806640625, -3.076904296875, -2.8857421875, -2.694580078125, -2.50341796875, -2.312255859375, -2.12109375, -1.929931640625, -1.73876953125, -1.547607421875, -1.3564453125, -1.165283203125, -0.97412109375, -0.782958984375, -0.591796875, -0.400634765625, -0.20947265625, -0.018310546875, 0.1728515625, 0.364013671875, 0.55517578125, 0.746337890625, 0.9375, 1.128662109375, 1.31982421875, 1.510986328125, 1.7021484375, 1.893310546875, 2.08447265625, 2.275634765625, 2.466796875, 2.657958984375, 2.84912109375, 3.040283203125, 3.2314453125, 3.422607421875, 3.61376953125, 3.804931640625, 3.99609375, 4.187255859375, 4.37841796875, 4.569580078125, 4.7607421875, 4.951904296875, 5.14306640625, 5.334228515625, 5.525390625, 5.716552734375, 5.90771484375, 6.098876953125, 6.2900390625, 6.481201171875, 6.67236328125, 6.863525390625, 7.0546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 8.0, 11.0, 23.0, 24.0, 25.0, 48.0, 71.0, 84.0, 187.0, 270.0, 505.0, 870.0, 1702.0, 3428.0, 7916.0, 19458.0, 52118.0, 156363.0, 396942.0, 268557.0, 86461.0, 30743.0, 12315.0, 5312.0, 2339.0, 1173.0, 619.0, 339.0, 242.0, 132.0, 85.0, 63.0, 36.0, 22.0, 27.0, 10.0, 8.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.7610931396484375, -1.701873779296875, -1.6426544189453125, -1.58343505859375, -1.5242156982421875, -1.464996337890625, -1.4057769775390625, -1.3465576171875, -1.2873382568359375, -1.228118896484375, -1.1688995361328125, -1.10968017578125, -1.0504608154296875, -0.991241455078125, -0.9320220947265625, -0.872802734375, -0.8135833740234375, -0.754364013671875, -0.6951446533203125, -0.63592529296875, -0.5767059326171875, -0.517486572265625, -0.4582672119140625, -0.3990478515625, -0.3398284912109375, -0.280609130859375, -0.2213897705078125, -0.16217041015625, -0.1029510498046875, -0.043731689453125, 0.0154876708984375, 0.07470703125, 0.1339263916015625, 0.193145751953125, 0.2523651123046875, 0.31158447265625, 0.3708038330078125, 0.430023193359375, 0.4892425537109375, 0.5484619140625, 0.6076812744140625, 0.666900634765625, 0.7261199951171875, 0.78533935546875, 0.8445587158203125, 0.903778076171875, 0.9629974365234375, 1.022216796875, 1.0814361572265625, 1.140655517578125, 1.1998748779296875, 1.25909423828125, 1.3183135986328125, 1.377532958984375, 1.4367523193359375, 1.4959716796875, 1.5551910400390625, 1.614410400390625, 1.6736297607421875, 1.73284912109375, 1.7920684814453125, 1.851287841796875, 1.9105072021484375, 1.9697265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 5.0, 11.0, 9.0, 8.0, 14.0, 14.0, 31.0, 24.0, 30.0, 33.0, 36.0, 30.0, 41.0, 39.0, 43.0, 42.0, 34.0, 44.0, 56.0, 52.0, 52.0, 46.0, 35.0, 27.0, 34.0, 33.0, 23.0, 27.0, 19.0, 13.0, 19.0, 7.0, 6.0, 9.0, 5.0, 5.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.3984375, -8.14532470703125, -7.8922119140625, -7.63909912109375, -7.385986328125, -7.13287353515625, -6.8797607421875, -6.62664794921875, -6.37353515625, -6.12042236328125, -5.8673095703125, -5.61419677734375, -5.361083984375, -5.10797119140625, -4.8548583984375, -4.60174560546875, -4.3486328125, -4.09552001953125, -3.8424072265625, -3.58929443359375, -3.336181640625, -3.08306884765625, -2.8299560546875, -2.57684326171875, -2.32373046875, -2.07061767578125, -1.8175048828125, -1.56439208984375, -1.311279296875, -1.05816650390625, -0.8050537109375, -0.55194091796875, -0.298828125, -0.04571533203125, 0.2073974609375, 0.46051025390625, 0.713623046875, 0.96673583984375, 1.2198486328125, 1.47296142578125, 1.72607421875, 1.97918701171875, 2.2322998046875, 2.48541259765625, 2.738525390625, 2.99163818359375, 3.2447509765625, 3.49786376953125, 3.7509765625, 4.00408935546875, 4.2572021484375, 4.51031494140625, 4.763427734375, 5.01654052734375, 5.2696533203125, 5.52276611328125, 5.77587890625, 6.02899169921875, 6.2821044921875, 6.53521728515625, 6.788330078125, 7.04144287109375, 7.2945556640625, 7.54766845703125, 7.80078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 5.0, 7.0, 8.0, 11.0, 26.0, 36.0, 82.0, 125.0, 238.0, 529.0, 1209.0, 3251.0, 10640.0, 46930.0, 315730.0, 545301.0, 97980.0, 18297.0, 5008.0, 1716.0, 745.0, 312.0, 163.0, 80.0, 49.0, 22.0, 17.0, 13.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1403656005859375, -1.104949951171875, -1.0695343017578125, -1.03411865234375, -0.9987030029296875, -0.963287353515625, -0.9278717041015625, -0.8924560546875, -0.8570404052734375, -0.821624755859375, -0.7862091064453125, -0.75079345703125, -0.7153778076171875, -0.679962158203125, -0.6445465087890625, -0.609130859375, -0.5737152099609375, -0.538299560546875, -0.5028839111328125, -0.46746826171875, -0.4320526123046875, -0.396636962890625, -0.3612213134765625, -0.3258056640625, -0.2903900146484375, -0.254974365234375, -0.2195587158203125, -0.18414306640625, -0.1487274169921875, -0.113311767578125, -0.0778961181640625, -0.04248046875, -0.0070648193359375, 0.028350830078125, 0.0637664794921875, 0.09918212890625, 0.1345977783203125, 0.170013427734375, 0.2054290771484375, 0.2408447265625, 0.2762603759765625, 0.311676025390625, 0.3470916748046875, 0.38250732421875, 0.4179229736328125, 0.453338623046875, 0.4887542724609375, 0.524169921875, 0.5595855712890625, 0.595001220703125, 0.6304168701171875, 0.66583251953125, 0.7012481689453125, 0.736663818359375, 0.7720794677734375, 0.8074951171875, 0.8429107666015625, 0.878326416015625, 0.9137420654296875, 0.94915771484375, 0.9845733642578125, 1.019989013671875, 1.0554046630859375, 1.0908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 7.0, 8.0, 13.0, 15.0, 20.0, 27.0, 30.0, 35.0, 41.0, 59.0, 63.0, 69.0, 66.0, 80.0, 59.0, 66.0, 48.0, 63.0, 46.0, 24.0, 33.0, 22.0, 17.0, 10.0, 9.0, 9.0, 7.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003364086151123047, -0.0003260299563407898, -0.0003156512975692749, -0.00030527263879776, -0.0002948939800262451, -0.0002845153212547302, -0.00027413666248321533, -0.00026375800371170044, -0.00025337934494018555, -0.00024300068616867065, -0.00023262202739715576, -0.00022224336862564087, -0.00021186470985412598, -0.00020148605108261108, -0.0001911073923110962, -0.0001807287335395813, -0.0001703500747680664, -0.00015997141599655151, -0.00014959275722503662, -0.00013921409845352173, -0.00012883543968200684, -0.00011845678091049194, -0.00010807812213897705, -9.769946336746216e-05, -8.732080459594727e-05, -7.694214582443237e-05, -6.656348705291748e-05, -5.618482828140259e-05, -4.5806169509887695e-05, -3.54275107383728e-05, -2.504885196685791e-05, -1.4670193195343018e-05, -4.291534423828125e-06, 6.087124347686768e-06, 1.646578311920166e-05, 2.6844441890716553e-05, 3.7223100662231445e-05, 4.760175943374634e-05, 5.798041820526123e-05, 6.835907697677612e-05, 7.873773574829102e-05, 8.911639451980591e-05, 9.94950532913208e-05, 0.0001098737120628357, 0.00012025237083435059, 0.00013063102960586548, 0.00014100968837738037, 0.00015138834714889526, 0.00016176700592041016, 0.00017214566469192505, 0.00018252432346343994, 0.00019290298223495483, 0.00020328164100646973, 0.00021366029977798462, 0.0002240389585494995, 0.0002344176173210144, 0.0002447962760925293, 0.0002551749348640442, 0.0002655535936355591, 0.000275932252407074, 0.00028631091117858887, 0.00029668956995010376, 0.00030706822872161865, 0.00031744688749313354, 0.00032782554626464844]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 13.0, 14.0, 16.0, 23.0, 33.0, 57.0, 117.0, 224.0, 501.0, 1394.0, 4340.0, 16387.0, 87127.0, 485567.0, 372936.0, 61461.0, 12617.0, 3564.0, 1184.0, 463.0, 214.0, 123.0, 66.0, 23.0, 18.0, 22.0, 12.0, 6.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2431640625, -1.20947265625, -1.17578125, -1.14208984375, -1.1083984375, -1.07470703125, -1.041015625, -1.00732421875, -0.9736328125, -0.93994140625, -0.90625, -0.87255859375, -0.8388671875, -0.80517578125, -0.771484375, -0.73779296875, -0.7041015625, -0.67041015625, -0.63671875, -0.60302734375, -0.5693359375, -0.53564453125, -0.501953125, -0.46826171875, -0.4345703125, -0.40087890625, -0.3671875, -0.33349609375, -0.2998046875, -0.26611328125, -0.232421875, -0.19873046875, -0.1650390625, -0.13134765625, -0.09765625, -0.06396484375, -0.0302734375, 0.00341796875, 0.037109375, 0.07080078125, 0.1044921875, 0.13818359375, 0.171875, 0.20556640625, 0.2392578125, 0.27294921875, 0.306640625, 0.34033203125, 0.3740234375, 0.40771484375, 0.44140625, 0.47509765625, 0.5087890625, 0.54248046875, 0.576171875, 0.60986328125, 0.6435546875, 0.67724609375, 0.7109375, 0.74462890625, 0.7783203125, 0.81201171875, 0.845703125, 0.87939453125, 0.9130859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 10.0, 17.0, 15.0, 13.0, 20.0, 31.0, 53.0, 52.0, 55.0, 70.0, 61.0, 64.0, 53.0, 70.0, 69.0, 65.0, 50.0, 32.0, 32.0, 28.0, 20.0, 18.0, 18.0, 12.0, 14.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1510009765625, -0.14468955993652344, -0.13837814331054688, -0.1320667266845703, -0.12575531005859375, -0.11944389343261719, -0.11313247680664062, -0.10682106018066406, -0.1005096435546875, -0.09419822692871094, -0.08788681030273438, -0.08157539367675781, -0.07526397705078125, -0.06895256042480469, -0.06264114379882812, -0.05632972717285156, -0.050018310546875, -0.04370689392089844, -0.037395477294921875, -0.031084060668945312, -0.02477264404296875, -0.018461227416992188, -0.012149810791015625, -0.0058383941650390625, 0.0004730224609375, 0.0067844390869140625, 0.013095855712890625, 0.019407272338867188, 0.02571868896484375, 0.03203010559082031, 0.038341522216796875, 0.04465293884277344, 0.05096435546875, 0.05727577209472656, 0.06358718872070312, 0.06989860534667969, 0.07621002197265625, 0.08252143859863281, 0.08883285522460938, 0.09514427185058594, 0.1014556884765625, 0.10776710510253906, 0.11407852172851562, 0.12038993835449219, 0.12670135498046875, 0.1330127716064453, 0.13932418823242188, 0.14563560485839844, 0.151947021484375, 0.15825843811035156, 0.16456985473632812, 0.1708812713623047, 0.17719268798828125, 0.1835041046142578, 0.18981552124023438, 0.19612693786621094, 0.2024383544921875, 0.20874977111816406, 0.21506118774414062, 0.2213726043701172, 0.22768402099609375, 0.2339954376220703, 0.24030685424804688, 0.24661827087402344, 0.2529296875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 8.0, 17.0, 12.0, 36.0, 46.0, 86.0, 123.0, 156.0, 174.0, 134.0, 81.0, 46.0, 37.0, 19.0, 9.0, 8.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.988353252410889, -4.659221172332764, -4.330089092254639, -4.000957012176514, -3.6718246936798096, -3.3426926136016846, -3.0135602951049805, -2.6844282150268555, -2.3552961349487305, -2.0261640548706055, -1.697031855583191, -1.3678996562957764, -1.0387675762176514, -0.7096354961395264, -0.3805032968521118, -0.051371097564697266, 0.27776098251342773, 0.6068931221961975, 0.9360252618789673, 1.2651574611663818, 1.5942895412445068, 1.9234216213226318, 2.252553939819336, 2.581686019897461, 2.910818099975586, 3.239950180053711, 3.569082260131836, 3.89821457862854, 4.227346420288086, 4.556478500366211, 4.885611057281494, 5.214743137359619, 5.543874740600586, 5.873006820678711, 6.202138900756836, 6.531270980834961, 6.860403060913086, 7.189535140991211, 7.518667697906494, 7.847799777984619, 8.176931381225586, 8.506063461303711, 8.835195541381836, 9.164327621459961, 9.493459701538086, 9.822591781616211, 10.151723861694336, 10.480855941772461, 10.809988975524902, 11.139121055603027, 11.468253135681152, 11.797385215759277, 12.126517295837402, 12.455649375915527, 12.784781455993652, 13.113914489746094, 13.443046569824219, 13.772178649902344, 14.101310729980469, 14.430442810058594, 14.759574890136719, 15.088706970214844, 15.417839050292969, 15.746971130371094, 16.07610321044922]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 5.0, 11.0, 22.0, 14.0, 30.0, 35.0, 47.0, 34.0, 52.0, 73.0, 72.0, 68.0, 78.0, 79.0, 69.0, 65.0, 51.0, 34.0, 33.0, 31.0, 20.0, 18.0, 18.0, 11.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.821997165679932, -4.639649391174316, -4.457301616668701, -4.274953842163086, -4.092606067657471, -3.9102582931518555, -3.727910280227661, -3.545562505722046, -3.3632147312164307, -3.1808669567108154, -2.9985191822052, -2.816171169281006, -2.6338233947753906, -2.4514756202697754, -2.26912784576416, -2.086780071258545, -1.9044322967529297, -1.7220845222473145, -1.5397367477416992, -1.3573888540267944, -1.1750410795211792, -0.992693305015564, -0.8103454113006592, -0.627997636795044, -0.4456498622894287, -0.2633020579814911, -0.08095425367355347, 0.10139358043670654, 0.2837413549423218, 0.466089129447937, 0.6484370231628418, 0.830784797668457, 1.013132095336914, 1.1954798698425293, 1.3778276443481445, 1.5601755380630493, 1.7425233125686646, 1.9248710870742798, 2.1072189807891846, 2.2895667552948, 2.471914529800415, 2.6542623043060303, 2.8366100788116455, 3.01895809173584, 3.201305866241455, 3.3836536407470703, 3.5660014152526855, 3.748349189758301, 3.930696964263916, 4.113044738769531, 4.2953925132751465, 4.477740287780762, 4.660088062286377, 4.842435836791992, 5.024784088134766, 5.207131385803223, 5.389479637145996, 5.571827411651611, 5.754175186157227, 5.936522960662842, 6.118870735168457, 6.301218509674072, 6.4835662841796875, 6.665914535522461, 6.848261833190918]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 6.0, 5.0, 5.0, 12.0, 10.0, 10.0, 14.0, 38.0, 37.0, 70.0, 189.0, 625.0, 2711.0, 18816.0, 242512.0, 723554.0, 52028.0, 6149.0, 1173.0, 298.0, 105.0, 57.0, 39.0, 22.0, 16.0, 12.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.3125, -10.98193359375, -10.6513671875, -10.32080078125, -9.990234375, -9.65966796875, -9.3291015625, -8.99853515625, -8.66796875, -8.33740234375, -8.0068359375, -7.67626953125, -7.345703125, -7.01513671875, -6.6845703125, -6.35400390625, -6.0234375, -5.69287109375, -5.3623046875, -5.03173828125, -4.701171875, -4.37060546875, -4.0400390625, -3.70947265625, -3.37890625, -3.04833984375, -2.7177734375, -2.38720703125, -2.056640625, -1.72607421875, -1.3955078125, -1.06494140625, -0.734375, -0.40380859375, -0.0732421875, 0.25732421875, 0.587890625, 0.91845703125, 1.2490234375, 1.57958984375, 1.91015625, 2.24072265625, 2.5712890625, 2.90185546875, 3.232421875, 3.56298828125, 3.8935546875, 4.22412109375, 4.5546875, 4.88525390625, 5.2158203125, 5.54638671875, 5.876953125, 6.20751953125, 6.5380859375, 6.86865234375, 7.19921875, 7.52978515625, 7.8603515625, 8.19091796875, 8.521484375, 8.85205078125, 9.1826171875, 9.51318359375, 9.84375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 6.0, 10.0, 9.0, 7.0, 17.0, 24.0, 26.0, 34.0, 38.0, 54.0, 57.0, 63.0, 76.0, 61.0, 67.0, 69.0, 65.0, 65.0, 46.0, 45.0, 29.0, 29.0, 20.0, 17.0, 20.0, 11.0, 4.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.4603271484375, -8.076904296875, -7.6934814453125, -7.31005859375, -6.9266357421875, -6.543212890625, -6.1597900390625, -5.7763671875, -5.3929443359375, -5.009521484375, -4.6260986328125, -4.24267578125, -3.8592529296875, -3.475830078125, -3.0924072265625, -2.708984375, -2.3255615234375, -1.942138671875, -1.5587158203125, -1.17529296875, -0.7918701171875, -0.408447265625, -0.0250244140625, 0.3583984375, 0.7418212890625, 1.125244140625, 1.5086669921875, 1.89208984375, 2.2755126953125, 2.658935546875, 3.0423583984375, 3.42578125, 3.8092041015625, 4.192626953125, 4.5760498046875, 4.95947265625, 5.3428955078125, 5.726318359375, 6.1097412109375, 6.4931640625, 6.8765869140625, 7.260009765625, 7.6434326171875, 8.02685546875, 8.4102783203125, 8.793701171875, 9.1771240234375, 9.560546875, 9.9439697265625, 10.327392578125, 10.7108154296875, 11.09423828125, 11.4776611328125, 11.861083984375, 12.2445068359375, 12.6279296875, 13.0113525390625, 13.394775390625, 13.7781982421875, 14.16162109375, 14.5450439453125, 14.928466796875, 15.3118896484375, 15.6953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 10.0, 13.0, 17.0, 16.0, 22.0, 32.0, 33.0, 45.0, 67.0, 45.0, 61.0, 78.0, 97.0, 119.0, 158.0, 351.0, 1162.0, 7586.0, 160464.0, 838749.0, 34911.0, 2867.0, 653.0, 239.0, 130.0, 95.0, 77.0, 62.0, 56.0, 61.0, 49.0, 37.0, 28.0, 27.0, 27.0, 16.0, 12.0, 12.0, 13.0, 4.0, 6.0, 4.0, 8.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-12.2578125, -11.8895263671875, -11.521240234375, -11.1529541015625, -10.78466796875, -10.4163818359375, -10.048095703125, -9.6798095703125, -9.3115234375, -8.9432373046875, -8.574951171875, -8.2066650390625, -7.83837890625, -7.4700927734375, -7.101806640625, -6.7335205078125, -6.365234375, -5.9969482421875, -5.628662109375, -5.2603759765625, -4.89208984375, -4.5238037109375, -4.155517578125, -3.7872314453125, -3.4189453125, -3.0506591796875, -2.682373046875, -2.3140869140625, -1.94580078125, -1.5775146484375, -1.209228515625, -0.8409423828125, -0.47265625, -0.1043701171875, 0.263916015625, 0.6322021484375, 1.00048828125, 1.3687744140625, 1.737060546875, 2.1053466796875, 2.4736328125, 2.8419189453125, 3.210205078125, 3.5784912109375, 3.94677734375, 4.3150634765625, 4.683349609375, 5.0516357421875, 5.419921875, 5.7882080078125, 6.156494140625, 6.5247802734375, 6.89306640625, 7.2613525390625, 7.629638671875, 7.9979248046875, 8.3662109375, 8.7344970703125, 9.102783203125, 9.4710693359375, 9.83935546875, 10.2076416015625, 10.575927734375, 10.9442138671875, 11.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 2.0, 14.0, 6.0, 5.0, 12.0, 17.0, 12.0, 16.0, 23.0, 30.0, 23.0, 17.0, 23.0, 27.0, 24.0, 27.0, 31.0, 24.0, 34.0, 46.0, 41.0, 31.0, 40.0, 41.0, 41.0, 25.0, 29.0, 26.0, 25.0, 29.0, 34.0, 16.0, 22.0, 19.0, 21.0, 18.0, 16.0, 16.0, 17.0, 9.0, 7.0, 14.0, 8.0, 13.0, 8.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.55859375, -6.32904052734375, -6.0994873046875, -5.86993408203125, -5.640380859375, -5.41082763671875, -5.1812744140625, -4.95172119140625, -4.72216796875, -4.49261474609375, -4.2630615234375, -4.03350830078125, -3.803955078125, -3.57440185546875, -3.3448486328125, -3.11529541015625, -2.8857421875, -2.65618896484375, -2.4266357421875, -2.19708251953125, -1.967529296875, -1.73797607421875, -1.5084228515625, -1.27886962890625, -1.04931640625, -0.81976318359375, -0.5902099609375, -0.36065673828125, -0.131103515625, 0.09844970703125, 0.3280029296875, 0.55755615234375, 0.787109375, 1.01666259765625, 1.2462158203125, 1.47576904296875, 1.705322265625, 1.93487548828125, 2.1644287109375, 2.39398193359375, 2.62353515625, 2.85308837890625, 3.0826416015625, 3.31219482421875, 3.541748046875, 3.77130126953125, 4.0008544921875, 4.23040771484375, 4.4599609375, 4.68951416015625, 4.9190673828125, 5.14862060546875, 5.378173828125, 5.60772705078125, 5.8372802734375, 6.06683349609375, 6.29638671875, 6.52593994140625, 6.7554931640625, 6.98504638671875, 7.214599609375, 7.44415283203125, 7.6737060546875, 7.90325927734375, 8.1328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 14.0, 14.0, 33.0, 37.0, 41.0, 88.0, 132.0, 201.0, 366.0, 649.0, 1205.0, 2573.0, 6377.0, 18987.0, 76188.0, 464428.0, 385414.0, 64237.0, 16767.0, 5757.0, 2407.0, 1157.0, 628.0, 288.0, 209.0, 112.0, 68.0, 48.0, 41.0, 11.0, 17.0, 18.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.3868255615234375, -1.342010498046875, -1.2971954345703125, -1.25238037109375, -1.2075653076171875, -1.162750244140625, -1.1179351806640625, -1.0731201171875, -1.0283050537109375, -0.983489990234375, -0.9386749267578125, -0.89385986328125, -0.8490447998046875, -0.804229736328125, -0.7594146728515625, -0.714599609375, -0.6697845458984375, -0.624969482421875, -0.5801544189453125, -0.53533935546875, -0.4905242919921875, -0.445709228515625, -0.4008941650390625, -0.3560791015625, -0.3112640380859375, -0.266448974609375, -0.2216339111328125, -0.17681884765625, -0.1320037841796875, -0.087188720703125, -0.0423736572265625, 0.00244140625, 0.0472564697265625, 0.092071533203125, 0.1368865966796875, 0.18170166015625, 0.2265167236328125, 0.271331787109375, 0.3161468505859375, 0.3609619140625, 0.4057769775390625, 0.450592041015625, 0.4954071044921875, 0.54022216796875, 0.5850372314453125, 0.629852294921875, 0.6746673583984375, 0.719482421875, 0.7642974853515625, 0.809112548828125, 0.8539276123046875, 0.89874267578125, 0.9435577392578125, 0.988372802734375, 1.0331878662109375, 1.0780029296875, 1.1228179931640625, 1.167633056640625, 1.2124481201171875, 1.25726318359375, 1.3020782470703125, 1.346893310546875, 1.3917083740234375, 1.4365234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 13.0, 13.0, 14.0, 21.0, 29.0, 34.0, 59.0, 68.0, 130.0, 149.0, 132.0, 99.0, 54.0, 45.0, 33.0, 27.0, 20.0, 14.0, 11.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00038170814514160156, -0.00037253648042678833, -0.0003633648157119751, -0.00035419315099716187, -0.00034502148628234863, -0.0003358498215675354, -0.00032667815685272217, -0.00031750649213790894, -0.0003083348274230957, -0.00029916316270828247, -0.00028999149799346924, -0.000280819833278656, -0.0002716481685638428, -0.00026247650384902954, -0.0002533048391342163, -0.00024413317441940308, -0.00023496150970458984, -0.0002257898449897766, -0.00021661818027496338, -0.00020744651556015015, -0.00019827485084533691, -0.00018910318613052368, -0.00017993152141571045, -0.00017075985670089722, -0.00016158819198608398, -0.00015241652727127075, -0.00014324486255645752, -0.0001340731978416443, -0.00012490153312683105, -0.00011572986841201782, -0.00010655820369720459, -9.738653898239136e-05, -8.821487426757812e-05, -7.904320955276489e-05, -6.987154483795166e-05, -6.069988012313843e-05, -5.1528215408325195e-05, -4.235655069351196e-05, -3.318488597869873e-05, -2.4013221263885498e-05, -1.4841556549072266e-05, -5.669891834259033e-06, 3.5017728805541992e-06, 1.2673437595367432e-05, 2.1845102310180664e-05, 3.1016767024993896e-05, 4.018843173980713e-05, 4.936009645462036e-05, 5.8531761169433594e-05, 6.770342588424683e-05, 7.687509059906006e-05, 8.604675531387329e-05, 9.521842002868652e-05, 0.00010439008474349976, 0.00011356174945831299, 0.00012273341417312622, 0.00013190507888793945, 0.00014107674360275269, 0.00015024840831756592, 0.00015942007303237915, 0.00016859173774719238, 0.00017776340246200562, 0.00018693506717681885, 0.00019610673189163208, 0.0002052783966064453]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 9.0, 1.0, 9.0, 13.0, 14.0, 24.0, 23.0, 38.0, 72.0, 112.0, 192.0, 299.0, 610.0, 1276.0, 2851.0, 7168.0, 21804.0, 81037.0, 463672.0, 372739.0, 66759.0, 18569.0, 6239.0, 2567.0, 1133.0, 544.0, 313.0, 167.0, 106.0, 62.0, 42.0, 34.0, 21.0, 13.0, 11.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.079681396484375, -1.03045654296875, -0.981231689453125, -0.9320068359375, -0.882781982421875, -0.83355712890625, -0.784332275390625, -0.735107421875, -0.685882568359375, -0.63665771484375, -0.587432861328125, -0.5382080078125, -0.488983154296875, -0.43975830078125, -0.390533447265625, -0.34130859375, -0.292083740234375, -0.24285888671875, -0.193634033203125, -0.1444091796875, -0.095184326171875, -0.04595947265625, 0.003265380859375, 0.052490234375, 0.101715087890625, 0.15093994140625, 0.200164794921875, 0.2493896484375, 0.298614501953125, 0.34783935546875, 0.397064208984375, 0.4462890625, 0.495513916015625, 0.54473876953125, 0.593963623046875, 0.6431884765625, 0.692413330078125, 0.74163818359375, 0.790863037109375, 0.840087890625, 0.889312744140625, 0.93853759765625, 0.987762451171875, 1.0369873046875, 1.086212158203125, 1.13543701171875, 1.184661865234375, 1.23388671875, 1.283111572265625, 1.33233642578125, 1.381561279296875, 1.4307861328125, 1.480010986328125, 1.52923583984375, 1.578460693359375, 1.627685546875, 1.676910400390625, 1.72613525390625, 1.775360107421875, 1.8245849609375, 1.873809814453125, 1.92303466796875, 1.972259521484375, 2.021484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 15.0, 17.0, 20.0, 29.0, 25.0, 43.0, 52.0, 64.0, 91.0, 106.0, 113.0, 89.0, 64.0, 61.0, 50.0, 21.0, 21.0, 17.0, 20.0, 10.0, 12.0, 9.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.931640625, -0.9070281982421875, -0.882415771484375, -0.8578033447265625, -0.83319091796875, -0.8085784912109375, -0.783966064453125, -0.7593536376953125, -0.7347412109375, -0.7101287841796875, -0.685516357421875, -0.6609039306640625, -0.63629150390625, -0.6116790771484375, -0.587066650390625, -0.5624542236328125, -0.537841796875, -0.5132293701171875, -0.488616943359375, -0.4640045166015625, -0.43939208984375, -0.4147796630859375, -0.390167236328125, -0.3655548095703125, -0.3409423828125, -0.3163299560546875, -0.291717529296875, -0.2671051025390625, -0.24249267578125, -0.2178802490234375, -0.193267822265625, -0.1686553955078125, -0.14404296875, -0.1194305419921875, -0.094818115234375, -0.0702056884765625, -0.04559326171875, -0.0209808349609375, 0.003631591796875, 0.0282440185546875, 0.0528564453125, 0.0774688720703125, 0.102081298828125, 0.1266937255859375, 0.15130615234375, 0.1759185791015625, 0.200531005859375, 0.2251434326171875, 0.249755859375, 0.2743682861328125, 0.298980712890625, 0.3235931396484375, 0.34820556640625, 0.3728179931640625, 0.397430419921875, 0.4220428466796875, 0.4466552734375, 0.4712677001953125, 0.495880126953125, 0.5204925537109375, 0.54510498046875, 0.5697174072265625, 0.594329833984375, 0.6189422607421875, 0.6435546875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 15.0, 40.0, 68.0, 103.0, 180.0, 191.0, 187.0, 91.0, 58.0, 26.0, 17.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.85233497619629, -24.03775405883789, -23.22317123413086, -22.40859031677246, -21.59400749206543, -20.77942657470703, -19.96484375, -19.1502628326416, -18.33568000793457, -17.521099090576172, -16.70651626586914, -15.891934394836426, -15.077352523803711, -14.262771606445312, -13.448188781738281, -12.633607864379883, -11.819025993347168, -11.004444122314453, -10.189862251281738, -9.375280380249023, -8.560698509216309, -7.746117115020752, -6.931535243988037, -6.116953372955322, -5.302371501922607, -4.487789630889893, -3.6732077598571777, -2.858626127243042, -2.044044256210327, -1.2294626235961914, -0.41488075256347656, 0.3997011184692383, 1.2142829895019531, 2.028864860534668, 2.843446731567383, 3.6580283641815186, 4.4726104736328125, 5.287191867828369, 6.101773738861084, 6.916355609893799, 7.730937480926514, 8.54551887512207, 9.360100746154785, 10.1746826171875, 10.989264488220215, 11.80384635925293, 12.618428230285645, 13.43301010131836, 14.247591972351074, 15.062173843383789, 15.876755714416504, 16.69133758544922, 17.505918502807617, 18.32050132751465, 19.135082244873047, 19.949665069580078, 20.764245986938477, 21.578826904296875, 22.393409729003906, 23.207990646362305, 24.022573471069336, 24.837154388427734, 25.651737213134766, 26.466318130493164, 27.280900955200195]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 1.0, 7.0, 15.0, 20.0, 24.0, 24.0, 24.0, 18.0, 19.0, 25.0, 29.0, 38.0, 31.0, 52.0, 50.0, 35.0, 49.0, 43.0, 41.0, 41.0, 37.0, 44.0, 27.0, 35.0, 29.0, 33.0, 33.0, 27.0, 20.0, 19.0, 16.0, 17.0, 10.0, 12.0, 13.0, 9.0, 8.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.63160228729248, -12.160292625427246, -11.688982963562012, -11.217673301696777, -10.746363639831543, -10.275053977966309, -9.803743362426758, -9.332433700561523, -8.861124038696289, -8.389814376831055, -7.91850471496582, -7.447195053100586, -6.975885391235352, -6.504575729370117, -6.033265590667725, -5.56195592880249, -5.090646743774414, -4.61933708190918, -4.148027420043945, -3.676717519760132, -3.2054078578948975, -2.734098196029663, -2.2627882957458496, -1.7914786338806152, -1.3201689720153809, -0.8488592505455017, -0.37754952907562256, 0.09376025199890137, 0.5650699138641357, 1.0363795757293701, 1.5076894760131836, 1.978999137878418, 2.4503097534179688, 2.921619415283203, 3.3929290771484375, 3.864238977432251, 4.335548400878906, 4.806858062744141, 5.278168201446533, 5.749477863311768, 6.220787525177002, 6.692097187042236, 7.163406848907471, 7.634716987609863, 8.106026649475098, 8.577336311340332, 9.048645973205566, 9.5199556350708, 9.991265296936035, 10.46257495880127, 10.933884620666504, 11.405194282531738, 11.876503944396973, 12.347813606262207, 12.819124221801758, 13.290433883666992, 13.761743545532227, 14.233053207397461, 14.704362869262695, 15.17567253112793, 15.646982192993164, 16.1182918548584, 16.589601516723633, 17.060911178588867, 17.5322208404541]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 10.0, 7.0, 9.0, 10.0, 11.0, 18.0, 30.0, 36.0, 38.0, 44.0, 71.0, 112.0, 169.0, 278.0, 443.0, 852.0, 1880.0, 4561.0, 12651.0, 56587.0, 545609.0, 3040500.0, 464109.0, 47053.0, 11418.0, 3945.0, 1734.0, 820.0, 464.0, 258.0, 163.0, 108.0, 79.0, 47.0, 43.0, 22.0, 17.0, 16.0, 9.0, 12.0, 12.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.510498046875, -8.20068359375, -7.890869140625, -7.5810546875, -7.271240234375, -6.96142578125, -6.651611328125, -6.341796875, -6.031982421875, -5.72216796875, -5.412353515625, -5.1025390625, -4.792724609375, -4.48291015625, -4.173095703125, -3.86328125, -3.553466796875, -3.24365234375, -2.933837890625, -2.6240234375, -2.314208984375, -2.00439453125, -1.694580078125, -1.384765625, -1.074951171875, -0.76513671875, -0.455322265625, -0.1455078125, 0.164306640625, 0.47412109375, 0.783935546875, 1.09375, 1.403564453125, 1.71337890625, 2.023193359375, 2.3330078125, 2.642822265625, 2.95263671875, 3.262451171875, 3.572265625, 3.882080078125, 4.19189453125, 4.501708984375, 4.8115234375, 5.121337890625, 5.43115234375, 5.740966796875, 6.05078125, 6.360595703125, 6.67041015625, 6.980224609375, 7.2900390625, 7.599853515625, 7.90966796875, 8.219482421875, 8.529296875, 8.839111328125, 9.14892578125, 9.458740234375, 9.7685546875, 10.078369140625, 10.38818359375, 10.697998046875, 11.0078125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 13.0, 14.0, 28.0, 38.0, 28.0, 38.0, 39.0, 65.0, 74.0, 69.0, 63.0, 76.0, 81.0, 63.0, 56.0, 38.0, 43.0, 40.0, 22.0, 22.0, 20.0, 18.0, 13.0, 5.0, 10.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.96533203125, -6.7197265625, -6.47412109375, -6.228515625, -5.98291015625, -5.7373046875, -5.49169921875, -5.24609375, -5.00048828125, -4.7548828125, -4.50927734375, -4.263671875, -4.01806640625, -3.7724609375, -3.52685546875, -3.28125, -3.03564453125, -2.7900390625, -2.54443359375, -2.298828125, -2.05322265625, -1.8076171875, -1.56201171875, -1.31640625, -1.07080078125, -0.8251953125, -0.57958984375, -0.333984375, -0.08837890625, 0.1572265625, 0.40283203125, 0.6484375, 0.89404296875, 1.1396484375, 1.38525390625, 1.630859375, 1.87646484375, 2.1220703125, 2.36767578125, 2.61328125, 2.85888671875, 3.1044921875, 3.35009765625, 3.595703125, 3.84130859375, 4.0869140625, 4.33251953125, 4.578125, 4.82373046875, 5.0693359375, 5.31494140625, 5.560546875, 5.80615234375, 6.0517578125, 6.29736328125, 6.54296875, 6.78857421875, 7.0341796875, 7.27978515625, 7.525390625, 7.77099609375, 8.0166015625, 8.26220703125, 8.5078125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 4.0, 11.0, 31.0, 60.0, 105.0, 252.0, 853.0, 10362.0, 3910388.0, 268017.0, 3212.0, 576.0, 190.0, 88.0, 53.0, 19.0, 14.0, 10.0, 9.0, 10.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-43.28125, -42.3154296875, -41.349609375, -40.3837890625, -39.41796875, -38.4521484375, -37.486328125, -36.5205078125, -35.5546875, -34.5888671875, -33.623046875, -32.6572265625, -31.69140625, -30.7255859375, -29.759765625, -28.7939453125, -27.828125, -26.8623046875, -25.896484375, -24.9306640625, -23.96484375, -22.9990234375, -22.033203125, -21.0673828125, -20.1015625, -19.1357421875, -18.169921875, -17.2041015625, -16.23828125, -15.2724609375, -14.306640625, -13.3408203125, -12.375, -11.4091796875, -10.443359375, -9.4775390625, -8.51171875, -7.5458984375, -6.580078125, -5.6142578125, -4.6484375, -3.6826171875, -2.716796875, -1.7509765625, -0.78515625, 0.1806640625, 1.146484375, 2.1123046875, 3.078125, 4.0439453125, 5.009765625, 5.9755859375, 6.94140625, 7.9072265625, 8.873046875, 9.8388671875, 10.8046875, 11.7705078125, 12.736328125, 13.7021484375, 14.66796875, 15.6337890625, 16.599609375, 17.5654296875, 18.53125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 2.0, 3.0, 7.0, 11.0, 8.0, 6.0, 23.0, 23.0, 28.0, 41.0, 53.0, 72.0, 103.0, 146.0, 235.0, 415.0, 621.0, 669.0, 553.0, 366.0, 226.0, 117.0, 96.0, 73.0, 46.0, 30.0, 28.0, 19.0, 15.0, 10.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.439453125, -2.36407470703125, -2.2886962890625, -2.21331787109375, -2.137939453125, -2.06256103515625, -1.9871826171875, -1.91180419921875, -1.83642578125, -1.76104736328125, -1.6856689453125, -1.61029052734375, -1.534912109375, -1.45953369140625, -1.3841552734375, -1.30877685546875, -1.2333984375, -1.15802001953125, -1.0826416015625, -1.00726318359375, -0.931884765625, -0.85650634765625, -0.7811279296875, -0.70574951171875, -0.63037109375, -0.55499267578125, -0.4796142578125, -0.40423583984375, -0.328857421875, -0.25347900390625, -0.1781005859375, -0.10272216796875, -0.02734375, 0.04803466796875, 0.1234130859375, 0.19879150390625, 0.274169921875, 0.34954833984375, 0.4249267578125, 0.50030517578125, 0.57568359375, 0.65106201171875, 0.7264404296875, 0.80181884765625, 0.877197265625, 0.95257568359375, 1.0279541015625, 1.10333251953125, 1.1787109375, 1.25408935546875, 1.3294677734375, 1.40484619140625, 1.480224609375, 1.55560302734375, 1.6309814453125, 1.70635986328125, 1.78173828125, 1.85711669921875, 1.9324951171875, 2.00787353515625, 2.083251953125, 2.15863037109375, 2.2340087890625, 2.30938720703125, 2.384765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 7.0, 7.0, 13.0, 26.0, 40.0, 74.0, 87.0, 141.0, 171.0, 153.0, 118.0, 69.0, 48.0, 19.0, 17.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.299962043762207, -6.768779277801514, -6.23759651184082, -5.706414222717285, -5.175231456756592, -4.644048690795898, -4.112866401672363, -3.58168363571167, -3.0505008697509766, -2.519318103790283, -1.988135576248169, -1.4569529294967651, -0.9257702827453613, -0.39458751678466797, 0.1365950107574463, 0.6677775382995605, 1.198960304260254, 1.7301429510116577, 2.2613255977630615, 2.792508125305176, 3.323690891265869, 3.8548736572265625, 4.386055946350098, 4.917238712310791, 5.448421478271484, 5.979604244232178, 6.510787010192871, 7.041969299316406, 7.5731520652771, 8.104334831237793, 8.635517120361328, 9.16670036315918, 9.697881698608398, 10.229063987731934, 10.760247230529785, 11.29142951965332, 11.822612762451172, 12.353795051574707, 12.884977340698242, 13.416160583496094, 13.947342872619629, 14.478525161743164, 15.009708404541016, 15.54089069366455, 16.072072982788086, 16.603256225585938, 17.13443946838379, 17.665620803833008, 18.19680404663086, 18.72798728942871, 19.25916862487793, 19.79035186767578, 20.321535110473633, 20.852718353271484, 21.383899688720703, 21.915082931518555, 22.446266174316406, 22.977449417114258, 23.508630752563477, 24.039813995361328, 24.57099723815918, 25.10218048095703, 25.63336181640625, 26.1645450592041, 26.69572639465332]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 13.0, 14.0, 22.0, 25.0, 32.0, 32.0, 44.0, 61.0, 70.0, 62.0, 54.0, 60.0, 67.0, 60.0, 63.0, 56.0, 48.0, 45.0, 31.0, 38.0, 26.0, 16.0, 13.0, 14.0, 8.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.333297729492188, -8.063886642456055, -7.7944746017456055, -7.5250630378723145, -7.255651473999023, -6.986239910125732, -6.716828346252441, -6.44741678237915, -6.178005218505859, -5.908593654632568, -5.639182090759277, -5.369770526885986, -5.100358963012695, -4.830947399139404, -4.561535835266113, -4.292124271392822, -4.022712707519531, -3.7533011436462402, -3.483889579772949, -3.214478015899658, -2.945066452026367, -2.675654888153076, -2.406243324279785, -2.136831760406494, -1.8674201965332031, -1.598008632659912, -1.328597068786621, -1.05918550491333, -0.7897739410400391, -0.520362377166748, -0.25095081329345703, 0.018460750579833984, 0.2878713607788086, 0.5572829246520996, 0.8266944885253906, 1.0961060523986816, 1.3655176162719727, 1.6349291801452637, 1.9043407440185547, 2.1737523078918457, 2.4431638717651367, 2.7125754356384277, 2.9819869995117188, 3.2513985633850098, 3.520810127258301, 3.790221691131592, 4.059633255004883, 4.329044818878174, 4.598456382751465, 4.867867946624756, 5.137279510498047, 5.406691074371338, 5.676102638244629, 5.94551420211792, 6.214925765991211, 6.484337329864502, 6.753748893737793, 7.023160457611084, 7.292572021484375, 7.561983585357666, 7.831395149230957, 8.100807189941406, 8.370218276977539, 8.639629364013672, 8.909041404724121]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 12.0, 9.0, 31.0, 42.0, 116.0, 188.0, 365.0, 749.0, 1710.0, 3889.0, 9678.0, 27898.0, 121484.0, 602505.0, 217107.0, 40629.0, 12915.0, 5126.0, 2111.0, 1024.0, 458.0, 235.0, 121.0, 62.0, 35.0, 16.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7578125, -2.680450439453125, -2.60308837890625, -2.525726318359375, -2.4483642578125, -2.371002197265625, -2.29364013671875, -2.216278076171875, -2.138916015625, -2.061553955078125, -1.98419189453125, -1.906829833984375, -1.8294677734375, -1.752105712890625, -1.67474365234375, -1.597381591796875, -1.52001953125, -1.442657470703125, -1.36529541015625, -1.287933349609375, -1.2105712890625, -1.133209228515625, -1.05584716796875, -0.978485107421875, -0.901123046875, -0.823760986328125, -0.74639892578125, -0.669036865234375, -0.5916748046875, -0.514312744140625, -0.43695068359375, -0.359588623046875, -0.2822265625, -0.204864501953125, -0.12750244140625, -0.050140380859375, 0.0272216796875, 0.104583740234375, 0.18194580078125, 0.259307861328125, 0.336669921875, 0.414031982421875, 0.49139404296875, 0.568756103515625, 0.6461181640625, 0.723480224609375, 0.80084228515625, 0.878204345703125, 0.95556640625, 1.032928466796875, 1.11029052734375, 1.187652587890625, 1.2650146484375, 1.342376708984375, 1.41973876953125, 1.497100830078125, 1.574462890625, 1.651824951171875, 1.72918701171875, 1.806549072265625, 1.8839111328125, 1.961273193359375, 2.03863525390625, 2.115997314453125, 2.193359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 5.0, 6.0, 19.0, 18.0, 34.0, 32.0, 36.0, 57.0, 49.0, 90.0, 76.0, 73.0, 62.0, 64.0, 68.0, 66.0, 62.0, 40.0, 29.0, 37.0, 27.0, 17.0, 8.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.004638671875, -4.80615234375, -4.607666015625, -4.4091796875, -4.210693359375, -4.01220703125, -3.813720703125, -3.615234375, -3.416748046875, -3.21826171875, -3.019775390625, -2.8212890625, -2.622802734375, -2.42431640625, -2.225830078125, -2.02734375, -1.828857421875, -1.63037109375, -1.431884765625, -1.2333984375, -1.034912109375, -0.83642578125, -0.637939453125, -0.439453125, -0.240966796875, -0.04248046875, 0.156005859375, 0.3544921875, 0.552978515625, 0.75146484375, 0.949951171875, 1.1484375, 1.346923828125, 1.54541015625, 1.743896484375, 1.9423828125, 2.140869140625, 2.33935546875, 2.537841796875, 2.736328125, 2.934814453125, 3.13330078125, 3.331787109375, 3.5302734375, 3.728759765625, 3.92724609375, 4.125732421875, 4.32421875, 4.522705078125, 4.72119140625, 4.919677734375, 5.1181640625, 5.316650390625, 5.51513671875, 5.713623046875, 5.912109375, 6.110595703125, 6.30908203125, 6.507568359375, 6.7060546875, 6.904541015625, 7.10302734375, 7.301513671875, 7.5]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 8.0, 3.0, 9.0, 10.0, 15.0, 30.0, 38.0, 77.0, 124.0, 283.0, 550.0, 1324.0, 3802.0, 11766.0, 52987.0, 525195.0, 396463.0, 40535.0, 9761.0, 3230.0, 1254.0, 528.0, 224.0, 126.0, 66.0, 38.0, 22.0, 10.0, 18.0, 13.0, 7.0, 5.0, 5.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.25, -3.156951904296875, -3.06390380859375, -2.970855712890625, -2.8778076171875, -2.784759521484375, -2.69171142578125, -2.598663330078125, -2.505615234375, -2.412567138671875, -2.31951904296875, -2.226470947265625, -2.1334228515625, -2.040374755859375, -1.94732666015625, -1.854278564453125, -1.76123046875, -1.668182373046875, -1.57513427734375, -1.482086181640625, -1.3890380859375, -1.295989990234375, -1.20294189453125, -1.109893798828125, -1.016845703125, -0.923797607421875, -0.83074951171875, -0.737701416015625, -0.6446533203125, -0.551605224609375, -0.45855712890625, -0.365509033203125, -0.2724609375, -0.179412841796875, -0.08636474609375, 0.006683349609375, 0.0997314453125, 0.192779541015625, 0.28582763671875, 0.378875732421875, 0.471923828125, 0.564971923828125, 0.65802001953125, 0.751068115234375, 0.8441162109375, 0.937164306640625, 1.03021240234375, 1.123260498046875, 1.21630859375, 1.309356689453125, 1.40240478515625, 1.495452880859375, 1.5885009765625, 1.681549072265625, 1.77459716796875, 1.867645263671875, 1.960693359375, 2.053741455078125, 2.14678955078125, 2.239837646484375, 2.3328857421875, 2.425933837890625, 2.51898193359375, 2.612030029296875, 2.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 15.0, 7.0, 11.0, 18.0, 18.0, 16.0, 15.0, 27.0, 30.0, 40.0, 33.0, 30.0, 33.0, 36.0, 52.0, 47.0, 37.0, 56.0, 43.0, 43.0, 47.0, 49.0, 40.0, 44.0, 35.0, 27.0, 27.0, 16.0, 20.0, 16.0, 11.0, 16.0, 14.0, 10.0, 6.0, 0.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3125, -8.0380859375, -7.763671875, -7.4892578125, -7.21484375, -6.9404296875, -6.666015625, -6.3916015625, -6.1171875, -5.8427734375, -5.568359375, -5.2939453125, -5.01953125, -4.7451171875, -4.470703125, -4.1962890625, -3.921875, -3.6474609375, -3.373046875, -3.0986328125, -2.82421875, -2.5498046875, -2.275390625, -2.0009765625, -1.7265625, -1.4521484375, -1.177734375, -0.9033203125, -0.62890625, -0.3544921875, -0.080078125, 0.1943359375, 0.46875, 0.7431640625, 1.017578125, 1.2919921875, 1.56640625, 1.8408203125, 2.115234375, 2.3896484375, 2.6640625, 2.9384765625, 3.212890625, 3.4873046875, 3.76171875, 4.0361328125, 4.310546875, 4.5849609375, 4.859375, 5.1337890625, 5.408203125, 5.6826171875, 5.95703125, 6.2314453125, 6.505859375, 6.7802734375, 7.0546875, 7.3291015625, 7.603515625, 7.8779296875, 8.15234375, 8.4267578125, 8.701171875, 8.9755859375, 9.25]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 11.0, 20.0, 22.0, 21.0, 38.0, 42.0, 69.0, 102.0, 162.0, 263.0, 473.0, 863.0, 1851.0, 4242.0, 12673.0, 54448.0, 416927.0, 472910.0, 60767.0, 13839.0, 4605.0, 1937.0, 952.0, 518.0, 294.0, 137.0, 118.0, 70.0, 42.0, 41.0, 23.0, 14.0, 9.0, 5.0, 2.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.177734375, -1.145050048828125, -1.11236572265625, -1.079681396484375, -1.0469970703125, -1.014312744140625, -0.98162841796875, -0.948944091796875, -0.916259765625, -0.883575439453125, -0.85089111328125, -0.818206787109375, -0.7855224609375, -0.752838134765625, -0.72015380859375, -0.687469482421875, -0.65478515625, -0.622100830078125, -0.58941650390625, -0.556732177734375, -0.5240478515625, -0.491363525390625, -0.45867919921875, -0.425994873046875, -0.393310546875, -0.360626220703125, -0.32794189453125, -0.295257568359375, -0.2625732421875, -0.229888916015625, -0.19720458984375, -0.164520263671875, -0.1318359375, -0.099151611328125, -0.06646728515625, -0.033782958984375, -0.0010986328125, 0.031585693359375, 0.06427001953125, 0.096954345703125, 0.129638671875, 0.162322998046875, 0.19500732421875, 0.227691650390625, 0.2603759765625, 0.293060302734375, 0.32574462890625, 0.358428955078125, 0.39111328125, 0.423797607421875, 0.45648193359375, 0.489166259765625, 0.5218505859375, 0.554534912109375, 0.58721923828125, 0.619903564453125, 0.652587890625, 0.685272216796875, 0.71795654296875, 0.750640869140625, 0.7833251953125, 0.816009521484375, 0.84869384765625, 0.881378173828125, 0.9140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 9.0, 12.0, 7.0, 16.0, 54.0, 68.0, 97.0, 135.0, 180.0, 157.0, 96.0, 72.0, 40.0, 18.0, 14.0, 9.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005178451538085938, -0.0004976168274879456, -0.00047738850116729736, -0.00045716017484664917, -0.000436931848526001, -0.0004167035222053528, -0.0003964751958847046, -0.0003762468695640564, -0.0003560185432434082, -0.00033579021692276, -0.0003155618906021118, -0.0002953335642814636, -0.00027510523796081543, -0.00025487691164016724, -0.00023464858531951904, -0.00021442025899887085, -0.00019419193267822266, -0.00017396360635757446, -0.00015373528003692627, -0.00013350695371627808, -0.00011327862739562988, -9.305030107498169e-05, -7.28219747543335e-05, -5.25936484336853e-05, -3.236532211303711e-05, -1.2136995792388916e-05, 8.091330528259277e-06, 2.831965684890747e-05, 4.8547983169555664e-05, 6.877630949020386e-05, 8.900463581085205e-05, 0.00010923296213150024, 0.00012946128845214844, 0.00014968961477279663, 0.00016991794109344482, 0.00019014626741409302, 0.0002103745937347412, 0.0002306029200553894, 0.0002508312463760376, 0.0002710595726966858, 0.000291287899017334, 0.0003115162253379822, 0.00033174455165863037, 0.00035197287797927856, 0.00037220120429992676, 0.00039242953062057495, 0.00041265785694122314, 0.00043288618326187134, 0.00045311450958251953, 0.0004733428359031677, 0.0004935711622238159, 0.0005137994885444641, 0.0005340278148651123, 0.0005542561411857605, 0.0005744844675064087, 0.0005947127938270569, 0.0006149411201477051, 0.0006351694464683533, 0.0006553977727890015, 0.0006756260991096497, 0.0006958544254302979, 0.000716082751750946, 0.0007363110780715942, 0.0007565394043922424, 0.0007767677307128906]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 7.0, 4.0, 3.0, 9.0, 14.0, 18.0, 27.0, 33.0, 65.0, 105.0, 146.0, 273.0, 493.0, 917.0, 1841.0, 3853.0, 10534.0, 46450.0, 367521.0, 527414.0, 66233.0, 13584.0, 4587.0, 2067.0, 1019.0, 578.0, 307.0, 169.0, 86.0, 73.0, 45.0, 25.0, 16.0, 15.0, 11.0, 11.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.205078125, -1.17169189453125, -1.1383056640625, -1.10491943359375, -1.071533203125, -1.03814697265625, -1.0047607421875, -0.97137451171875, -0.93798828125, -0.90460205078125, -0.8712158203125, -0.83782958984375, -0.804443359375, -0.77105712890625, -0.7376708984375, -0.70428466796875, -0.6708984375, -0.63751220703125, -0.6041259765625, -0.57073974609375, -0.537353515625, -0.50396728515625, -0.4705810546875, -0.43719482421875, -0.40380859375, -0.37042236328125, -0.3370361328125, -0.30364990234375, -0.270263671875, -0.23687744140625, -0.2034912109375, -0.17010498046875, -0.13671875, -0.10333251953125, -0.0699462890625, -0.03656005859375, -0.003173828125, 0.03021240234375, 0.0635986328125, 0.09698486328125, 0.13037109375, 0.16375732421875, 0.1971435546875, 0.23052978515625, 0.263916015625, 0.29730224609375, 0.3306884765625, 0.36407470703125, 0.3974609375, 0.43084716796875, 0.4642333984375, 0.49761962890625, 0.531005859375, 0.56439208984375, 0.5977783203125, 0.63116455078125, 0.66455078125, 0.69793701171875, 0.7313232421875, 0.76470947265625, 0.798095703125, 0.83148193359375, 0.8648681640625, 0.89825439453125, 0.931640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 5.0, 13.0, 20.0, 25.0, 41.0, 56.0, 91.0, 112.0, 150.0, 135.0, 112.0, 75.0, 49.0, 40.0, 25.0, 14.0, 7.0, 10.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30712890625, -0.2980155944824219, -0.28890228271484375, -0.2797889709472656, -0.2706756591796875, -0.2615623474121094, -0.25244903564453125, -0.24333572387695312, -0.234222412109375, -0.22510910034179688, -0.21599578857421875, -0.20688247680664062, -0.1977691650390625, -0.18865585327148438, -0.17954254150390625, -0.17042922973632812, -0.16131591796875, -0.15220260620117188, -0.14308929443359375, -0.13397598266601562, -0.1248626708984375, -0.11574935913085938, -0.10663604736328125, -0.09752273559570312, -0.088409423828125, -0.07929611206054688, -0.07018280029296875, -0.061069488525390625, -0.0519561767578125, -0.042842864990234375, -0.03372955322265625, -0.024616241455078125, -0.0155029296875, -0.006389617919921875, 0.00272369384765625, 0.011837005615234375, 0.0209503173828125, 0.030063629150390625, 0.03917694091796875, 0.048290252685546875, 0.057403564453125, 0.06651687622070312, 0.07563018798828125, 0.08474349975585938, 0.0938568115234375, 0.10297012329101562, 0.11208343505859375, 0.12119674682617188, 0.13031005859375, 0.13942337036132812, 0.14853668212890625, 0.15764999389648438, 0.1667633056640625, 0.17587661743164062, 0.18498992919921875, 0.19410324096679688, 0.203216552734375, 0.21232986450195312, 0.22144317626953125, 0.23055648803710938, 0.2396697998046875, 0.24878311157226562, 0.25789642333984375, 0.2670097351074219, 0.276123046875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 10.0, 21.0, 39.0, 55.0, 115.0, 157.0, 224.0, 175.0, 94.0, 55.0, 29.0, 11.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.488933086395264, -5.083921909332275, -4.678911209106445, -4.273900032043457, -3.868889331817627, -3.4638781547546387, -3.0588672161102295, -2.6538562774658203, -2.248845338821411, -1.843834400177002, -1.4388234615325928, -1.033812403678894, -0.6288014650344849, -0.22379040718078613, 0.18122053146362305, 0.5862314701080322, 0.9912424087524414, 1.3962533473968506, 1.8012642860412598, 2.206275463104248, 2.611286163330078, 3.0162973403930664, 3.4213082790374756, 3.8263192176818848, 4.231329917907715, 4.636341094970703, 5.041351795196533, 5.4463629722595215, 5.851373672485352, 6.25638484954834, 6.661396026611328, 7.066406726837158, 7.471417427062988, 7.876428604125977, 8.281439781188965, 8.686450004577637, 9.091461181640625, 9.496472358703613, 9.901483535766602, 10.306493759155273, 10.711504936218262, 11.11651611328125, 11.521527290344238, 11.92653751373291, 12.331548690795898, 12.736559867858887, 13.141571044921875, 13.546581268310547, 13.951593399047852, 14.35660457611084, 14.761615753173828, 15.1666259765625, 15.571637153625488, 15.976648330688477, 16.38165855407715, 16.786670684814453, 17.191680908203125, 17.596691131591797, 18.0017032623291, 18.406713485717773, 18.811725616455078, 19.21673583984375, 19.621746063232422, 20.026758193969727, 20.4317684173584]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 5.0, 11.0, 7.0, 9.0, 26.0, 34.0, 37.0, 35.0, 51.0, 63.0, 71.0, 73.0, 64.0, 60.0, 68.0, 67.0, 63.0, 51.0, 46.0, 43.0, 27.0, 34.0, 9.0, 16.0, 12.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3008198738098145, -5.121241569519043, -4.9416632652282715, -4.7620849609375, -4.58250617980957, -4.402927875518799, -4.223349571228027, -4.043771266937256, -3.8641929626464844, -3.684614658355713, -3.5050363540649414, -3.325457811355591, -3.1458795070648193, -2.966301202774048, -2.7867226600646973, -2.607144355773926, -2.4275660514831543, -2.247987747192383, -2.0684094429016113, -1.8888309001922607, -1.7092525959014893, -1.5296742916107178, -1.3500958681106567, -1.1705174446105957, -0.9909391403198242, -0.811360776424408, -0.6317824125289917, -0.45220404863357544, -0.2726256847381592, -0.09304732084274292, 0.08653104305267334, 0.2661094665527344, 0.44568729400634766, 0.6252656579017639, 0.8048440217971802, 0.9844223856925964, 1.1640007495880127, 1.3435790538787842, 1.5231574773788452, 1.7027359008789062, 1.8823142051696777, 2.061892509460449, 2.2414708137512207, 2.4210493564605713, 2.6006276607513428, 2.7802059650421143, 2.959784507751465, 3.1393628120422363, 3.318941116333008, 3.4985194206237793, 3.678097724914551, 3.8576762676239014, 4.037254333496094, 4.216833114624023, 4.396411418914795, 4.575989723205566, 4.755568027496338, 4.935146331787109, 5.114724636077881, 5.294302940368652, 5.473881721496582, 5.6534600257873535, 5.833038330078125, 6.0126166343688965, 6.192194938659668]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 8.0, 6.0, 16.0, 12.0, 39.0, 73.0, 189.0, 676.0, 3007.0, 25392.0, 908994.0, 101551.0, 6866.0, 1224.0, 290.0, 99.0, 37.0, 19.0, 14.0, 11.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.875, -14.390625, -13.90625, -13.421875, -12.9375, -12.453125, -11.96875, -11.484375, -11.0, -10.515625, -10.03125, -9.546875, -9.0625, -8.578125, -8.09375, -7.609375, -7.125, -6.640625, -6.15625, -5.671875, -5.1875, -4.703125, -4.21875, -3.734375, -3.25, -2.765625, -2.28125, -1.796875, -1.3125, -0.828125, -0.34375, 0.140625, 0.625, 1.109375, 1.59375, 2.078125, 2.5625, 3.046875, 3.53125, 4.015625, 4.5, 4.984375, 5.46875, 5.953125, 6.4375, 6.921875, 7.40625, 7.890625, 8.375, 8.859375, 9.34375, 9.828125, 10.3125, 10.796875, 11.28125, 11.765625, 12.25, 12.734375, 13.21875, 13.703125, 14.1875, 14.671875, 15.15625, 15.640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 5.0, 5.0, 4.0, 14.0, 20.0, 19.0, 20.0, 31.0, 32.0, 43.0, 37.0, 38.0, 44.0, 55.0, 60.0, 59.0, 57.0, 48.0, 62.0, 46.0, 49.0, 35.0, 31.0, 28.0, 34.0, 20.0, 21.0, 18.0, 10.0, 13.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.260498046875, -7.94287109375, -7.625244140625, -7.3076171875, -6.989990234375, -6.67236328125, -6.354736328125, -6.037109375, -5.719482421875, -5.40185546875, -5.084228515625, -4.7666015625, -4.448974609375, -4.13134765625, -3.813720703125, -3.49609375, -3.178466796875, -2.86083984375, -2.543212890625, -2.2255859375, -1.907958984375, -1.59033203125, -1.272705078125, -0.955078125, -0.637451171875, -0.31982421875, -0.002197265625, 0.3154296875, 0.633056640625, 0.95068359375, 1.268310546875, 1.5859375, 1.903564453125, 2.22119140625, 2.538818359375, 2.8564453125, 3.174072265625, 3.49169921875, 3.809326171875, 4.126953125, 4.444580078125, 4.76220703125, 5.079833984375, 5.3974609375, 5.715087890625, 6.03271484375, 6.350341796875, 6.66796875, 6.985595703125, 7.30322265625, 7.620849609375, 7.9384765625, 8.256103515625, 8.57373046875, 8.891357421875, 9.208984375, 9.526611328125, 9.84423828125, 10.161865234375, 10.4794921875, 10.797119140625, 11.11474609375, 11.432373046875, 11.75]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 10.0, 10.0, 20.0, 15.0, 33.0, 43.0, 43.0, 44.0, 86.0, 115.0, 205.0, 339.0, 552.0, 964.0, 1761.0, 3723.0, 8752.0, 25747.0, 140137.0, 696985.0, 128013.0, 24828.0, 8420.0, 3607.0, 1766.0, 887.0, 506.0, 281.0, 211.0, 131.0, 82.0, 56.0, 29.0, 26.0, 23.0, 24.0, 18.0, 12.0, 9.0, 4.0, 4.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.609375, -4.4581298828125, -4.306884765625, -4.1556396484375, -4.00439453125, -3.8531494140625, -3.701904296875, -3.5506591796875, -3.3994140625, -3.2481689453125, -3.096923828125, -2.9456787109375, -2.79443359375, -2.6431884765625, -2.491943359375, -2.3406982421875, -2.189453125, -2.0382080078125, -1.886962890625, -1.7357177734375, -1.58447265625, -1.4332275390625, -1.281982421875, -1.1307373046875, -0.9794921875, -0.8282470703125, -0.677001953125, -0.5257568359375, -0.37451171875, -0.2232666015625, -0.072021484375, 0.0792236328125, 0.23046875, 0.3817138671875, 0.532958984375, 0.6842041015625, 0.83544921875, 0.9866943359375, 1.137939453125, 1.2891845703125, 1.4404296875, 1.5916748046875, 1.742919921875, 1.8941650390625, 2.04541015625, 2.1966552734375, 2.347900390625, 2.4991455078125, 2.650390625, 2.8016357421875, 2.952880859375, 3.1041259765625, 3.25537109375, 3.4066162109375, 3.557861328125, 3.7091064453125, 3.8603515625, 4.0115966796875, 4.162841796875, 4.3140869140625, 4.46533203125, 4.6165771484375, 4.767822265625, 4.9190673828125, 5.0703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 9.0, 9.0, 12.0, 10.0, 16.0, 13.0, 13.0, 25.0, 19.0, 20.0, 20.0, 22.0, 29.0, 26.0, 33.0, 34.0, 51.0, 33.0, 29.0, 45.0, 37.0, 43.0, 38.0, 33.0, 42.0, 38.0, 39.0, 23.0, 19.0, 26.0, 23.0, 26.0, 28.0, 9.0, 14.0, 14.0, 12.0, 12.0, 9.0, 4.0, 9.0, 7.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.046875, -8.768310546875, -8.48974609375, -8.211181640625, -7.9326171875, -7.654052734375, -7.37548828125, -7.096923828125, -6.818359375, -6.539794921875, -6.26123046875, -5.982666015625, -5.7041015625, -5.425537109375, -5.14697265625, -4.868408203125, -4.58984375, -4.311279296875, -4.03271484375, -3.754150390625, -3.4755859375, -3.197021484375, -2.91845703125, -2.639892578125, -2.361328125, -2.082763671875, -1.80419921875, -1.525634765625, -1.2470703125, -0.968505859375, -0.68994140625, -0.411376953125, -0.1328125, 0.145751953125, 0.42431640625, 0.702880859375, 0.9814453125, 1.260009765625, 1.53857421875, 1.817138671875, 2.095703125, 2.374267578125, 2.65283203125, 2.931396484375, 3.2099609375, 3.488525390625, 3.76708984375, 4.045654296875, 4.32421875, 4.602783203125, 4.88134765625, 5.159912109375, 5.4384765625, 5.717041015625, 5.99560546875, 6.274169921875, 6.552734375, 6.831298828125, 7.10986328125, 7.388427734375, 7.6669921875, 7.945556640625, 8.22412109375, 8.502685546875, 8.78125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 12.0, 9.0, 13.0, 42.0, 47.0, 90.0, 138.0, 288.0, 633.0, 1660.0, 5198.0, 22008.0, 181083.0, 734766.0, 83538.0, 13308.0, 3452.0, 1214.0, 509.0, 207.0, 116.0, 58.0, 47.0, 39.0, 20.0, 11.0, 5.0, 4.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8137664794921875, -1.759368896484375, -1.7049713134765625, -1.65057373046875, -1.5961761474609375, -1.541778564453125, -1.4873809814453125, -1.4329833984375, -1.3785858154296875, -1.324188232421875, -1.2697906494140625, -1.21539306640625, -1.1609954833984375, -1.106597900390625, -1.0522003173828125, -0.997802734375, -0.9434051513671875, -0.889007568359375, -0.8346099853515625, -0.78021240234375, -0.7258148193359375, -0.671417236328125, -0.6170196533203125, -0.5626220703125, -0.5082244873046875, -0.453826904296875, -0.3994293212890625, -0.34503173828125, -0.2906341552734375, -0.236236572265625, -0.1818389892578125, -0.12744140625, -0.0730438232421875, -0.018646240234375, 0.0357513427734375, 0.09014892578125, 0.1445465087890625, 0.198944091796875, 0.2533416748046875, 0.3077392578125, 0.3621368408203125, 0.416534423828125, 0.4709320068359375, 0.52532958984375, 0.5797271728515625, 0.634124755859375, 0.6885223388671875, 0.742919921875, 0.7973175048828125, 0.851715087890625, 0.9061126708984375, 0.96051025390625, 1.0149078369140625, 1.069305419921875, 1.1237030029296875, 1.1781005859375, 1.2324981689453125, 1.286895751953125, 1.3412933349609375, 1.39569091796875, 1.4500885009765625, 1.504486083984375, 1.5588836669921875, 1.61328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 10.0, 10.0, 10.0, 20.0, 24.0, 54.0, 52.0, 68.0, 78.0, 134.0, 121.0, 107.0, 86.0, 43.0, 34.0, 23.0, 26.0, 14.0, 14.0, 14.0, 11.0, 5.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.00021111778914928436, -0.0002043209969997406, -0.00019752420485019684, -0.00019072741270065308, -0.00018393062055110931, -0.00017713382840156555, -0.0001703370362520218, -0.00016354024410247803, -0.00015674345195293427, -0.0001499466598033905, -0.00014314986765384674, -0.00013635307550430298, -0.00012955628335475922, -0.00012275949120521545, -0.00011596269905567169, -0.00010916590690612793, -0.00010236911475658417, -9.55723226070404e-05, -8.877553045749664e-05, -8.197873830795288e-05, -7.518194615840912e-05, -6.838515400886536e-05, -6.15883618593216e-05, -5.479156970977783e-05, -4.799477756023407e-05, -4.119798541069031e-05, -3.4401193261146545e-05, -2.7604401111602783e-05, -2.080760896205902e-05, -1.4010816812515259e-05, -7.214024662971497e-06, -4.172325134277344e-07, 6.379559636116028e-06, 1.317635178565979e-05, 1.9973143935203552e-05, 2.6769936084747314e-05, 3.356672823429108e-05, 4.036352038383484e-05, 4.71603125333786e-05, 5.395710468292236e-05, 6.0753896832466125e-05, 6.755068898200989e-05, 7.434748113155365e-05, 8.114427328109741e-05, 8.794106543064117e-05, 9.473785758018494e-05, 0.0001015346497297287, 0.00010833144187927246, 0.00011512823402881622, 0.00012192502617835999, 0.00012872181832790375, 0.0001355186104774475, 0.00014231540262699127, 0.00014911219477653503, 0.0001559089869260788, 0.00016270577907562256, 0.00016950257122516632, 0.00017629936337471008, 0.00018309615552425385, 0.0001898929476737976, 0.00019668973982334137, 0.00020348653197288513, 0.0002102833241224289, 0.00021708011627197266]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 15.0, 21.0, 12.0, 26.0, 56.0, 112.0, 202.0, 388.0, 828.0, 2201.0, 6532.0, 27012.0, 200285.0, 699816.0, 88072.0, 15625.0, 4411.0, 1552.0, 641.0, 329.0, 169.0, 90.0, 46.0, 32.0, 31.0, 14.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8837890625, -1.8289031982421875, -1.774017333984375, -1.7191314697265625, -1.66424560546875, -1.6093597412109375, -1.554473876953125, -1.4995880126953125, -1.4447021484375, -1.3898162841796875, -1.334930419921875, -1.2800445556640625, -1.22515869140625, -1.1702728271484375, -1.115386962890625, -1.0605010986328125, -1.005615234375, -0.9507293701171875, -0.895843505859375, -0.8409576416015625, -0.78607177734375, -0.7311859130859375, -0.676300048828125, -0.6214141845703125, -0.5665283203125, -0.5116424560546875, -0.456756591796875, -0.4018707275390625, -0.34698486328125, -0.2920989990234375, -0.237213134765625, -0.1823272705078125, -0.12744140625, -0.0725555419921875, -0.017669677734375, 0.0372161865234375, 0.09210205078125, 0.1469879150390625, 0.201873779296875, 0.2567596435546875, 0.3116455078125, 0.3665313720703125, 0.421417236328125, 0.4763031005859375, 0.53118896484375, 0.5860748291015625, 0.640960693359375, 0.6958465576171875, 0.750732421875, 0.8056182861328125, 0.860504150390625, 0.9153900146484375, 0.97027587890625, 1.0251617431640625, 1.080047607421875, 1.1349334716796875, 1.1898193359375, 1.2447052001953125, 1.299591064453125, 1.3544769287109375, 1.40936279296875, 1.4642486572265625, 1.519134521484375, 1.5740203857421875, 1.62890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 16.0, 19.0, 37.0, 52.0, 56.0, 106.0, 143.0, 165.0, 107.0, 64.0, 61.0, 37.0, 31.0, 25.0, 11.0, 9.0, 4.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.791015625, -0.759765625, -0.728515625, -0.697265625, -0.666015625, -0.634765625, -0.603515625, -0.572265625, -0.541015625, -0.509765625, -0.478515625, -0.447265625, -0.416015625, -0.384765625, -0.353515625, -0.322265625, -0.291015625, -0.259765625, -0.228515625, -0.197265625, -0.166015625, -0.134765625, -0.103515625, -0.072265625, -0.041015625, -0.009765625, 0.021484375, 0.052734375, 0.083984375, 0.115234375, 0.146484375, 0.177734375, 0.208984375, 0.240234375, 0.271484375, 0.302734375, 0.333984375, 0.365234375, 0.396484375, 0.427734375, 0.458984375, 0.490234375, 0.521484375, 0.552734375, 0.583984375, 0.615234375, 0.646484375, 0.677734375, 0.708984375, 0.740234375, 0.771484375, 0.802734375, 0.833984375, 0.865234375, 0.896484375, 0.927734375, 0.958984375, 0.990234375, 1.021484375, 1.052734375, 1.083984375, 1.115234375, 1.146484375, 1.177734375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 48.0, 177.0, 395.0, 289.0, 66.0, 21.0, 8.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.83898162841797, -38.08824920654297, -36.33751678466797, -34.5867805480957, -32.8360481262207, -31.085315704345703, -29.33458137512207, -27.583847045898438, -25.833114624023438, -24.082382202148438, -22.331647872924805, -20.580913543701172, -18.830181121826172, -17.079448699951172, -15.328714370727539, -13.577980995178223, -11.827247619628906, -10.07651424407959, -8.325780868530273, -6.575047492980957, -4.824314117431641, -3.073580741882324, -1.3228473663330078, 0.4278860092163086, 2.178619384765625, 3.9293527603149414, 5.680086135864258, 7.430819511413574, 9.18155288696289, 10.932286262512207, 12.683019638061523, 14.43375301361084, 16.184486389160156, 17.935218811035156, 19.68595314025879, 21.436687469482422, 23.187419891357422, 24.938152313232422, 26.688886642456055, 28.439620971679688, 30.190353393554688, 31.941085815429688, 33.69181823730469, 35.44255447387695, 37.19328689575195, 38.94401931762695, 40.69475555419922, 42.44548797607422, 44.19622039794922, 45.94695281982422, 47.69768524169922, 49.448421478271484, 51.199153900146484, 52.949886322021484, 54.70062255859375, 56.45135498046875, 58.20208740234375, 59.95281982421875, 61.70355224609375, 63.454288482666016, 65.20501708984375, 66.95575714111328, 68.70648956298828, 70.45722198486328, 72.20795440673828]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 12.0, 7.0, 13.0, 19.0, 12.0, 16.0, 25.0, 20.0, 23.0, 31.0, 31.0, 41.0, 37.0, 50.0, 45.0, 42.0, 55.0, 48.0, 34.0, 52.0, 41.0, 50.0, 38.0, 34.0, 44.0, 28.0, 28.0, 17.0, 19.0, 21.0, 14.0, 8.0, 11.0, 11.0, 6.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.167110443115234, -16.581321716308594, -15.99553108215332, -15.40974235534668, -14.823952674865723, -14.238162994384766, -13.652373313903809, -13.066583633422852, -12.480794906616211, -11.895005226135254, -11.309215545654297, -10.723426818847656, -10.1376371383667, -9.551847457885742, -8.966057777404785, -8.380268096923828, -7.794478416442871, -7.208688735961914, -6.622899532318115, -6.037109851837158, -5.451320648193359, -4.865530967712402, -4.279741287231445, -3.6939520835876465, -3.1081624031066895, -2.5223729610443115, -1.936583399772644, -1.3507938385009766, -0.7650043964385986, -0.1792149543762207, 0.40657472610473633, 0.9923639297485352, 1.5781536102294922, 2.16394305229187, 2.749732494354248, 3.335522174835205, 3.921311616897583, 4.507101058959961, 5.092890739440918, 5.678679943084717, 6.264469623565674, 6.850259304046631, 7.43604850769043, 8.021838188171387, 8.607627868652344, 9.193416595458984, 9.779207229614258, 10.364995956420898, 10.950785636901855, 11.536575317382812, 12.12236499786377, 12.708154678344727, 13.293943405151367, 13.879733085632324, 14.465522766113281, 15.051311492919922, 15.637102127075195, 16.222890853881836, 16.80868148803711, 17.39447021484375, 17.980260848999023, 18.566049575805664, 19.151840209960938, 19.737628936767578, 20.32341766357422]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 2.0, 4.0, 7.0, 9.0, 13.0, 19.0, 22.0, 40.0, 63.0, 96.0, 156.0, 249.0, 416.0, 582.0, 1087.0, 2149.0, 4541.0, 10570.0, 32650.0, 149573.0, 1326510.0, 2315506.0, 275737.0, 48533.0, 14387.0, 5622.0, 2582.0, 1223.0, 731.0, 440.0, 278.0, 145.0, 113.0, 67.0, 52.0, 36.0, 24.0, 12.0, 14.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6640625, -5.4388427734375, -5.213623046875, -4.9884033203125, -4.76318359375, -4.5379638671875, -4.312744140625, -4.0875244140625, -3.8623046875, -3.6370849609375, -3.411865234375, -3.1866455078125, -2.96142578125, -2.7362060546875, -2.510986328125, -2.2857666015625, -2.060546875, -1.8353271484375, -1.610107421875, -1.3848876953125, -1.15966796875, -0.9344482421875, -0.709228515625, -0.4840087890625, -0.2587890625, -0.0335693359375, 0.191650390625, 0.4168701171875, 0.64208984375, 0.8673095703125, 1.092529296875, 1.3177490234375, 1.54296875, 1.7681884765625, 1.993408203125, 2.2186279296875, 2.44384765625, 2.6690673828125, 2.894287109375, 3.1195068359375, 3.3447265625, 3.5699462890625, 3.795166015625, 4.0203857421875, 4.24560546875, 4.4708251953125, 4.696044921875, 4.9212646484375, 5.146484375, 5.3717041015625, 5.596923828125, 5.8221435546875, 6.04736328125, 6.2725830078125, 6.497802734375, 6.7230224609375, 6.9482421875, 7.1734619140625, 7.398681640625, 7.6239013671875, 7.84912109375, 8.0743408203125, 8.299560546875, 8.5247802734375, 8.75]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 4.0, 11.0, 3.0, 14.0, 24.0, 19.0, 29.0, 43.0, 53.0, 58.0, 82.0, 70.0, 82.0, 85.0, 73.0, 78.0, 50.0, 59.0, 47.0, 21.0, 31.0, 19.0, 10.0, 12.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.13702392578125, -7.8990478515625, -7.66107177734375, -7.423095703125, -7.18511962890625, -6.9471435546875, -6.70916748046875, -6.47119140625, -6.23321533203125, -5.9952392578125, -5.75726318359375, -5.519287109375, -5.28131103515625, -5.0433349609375, -4.80535888671875, -4.5673828125, -4.32940673828125, -4.0914306640625, -3.85345458984375, -3.615478515625, -3.37750244140625, -3.1395263671875, -2.90155029296875, -2.66357421875, -2.42559814453125, -2.1876220703125, -1.94964599609375, -1.711669921875, -1.47369384765625, -1.2357177734375, -0.99774169921875, -0.759765625, -0.52178955078125, -0.2838134765625, -0.04583740234375, 0.192138671875, 0.43011474609375, 0.6680908203125, 0.90606689453125, 1.14404296875, 1.38201904296875, 1.6199951171875, 1.85797119140625, 2.095947265625, 2.33392333984375, 2.5718994140625, 2.80987548828125, 3.0478515625, 3.28582763671875, 3.5238037109375, 3.76177978515625, 3.999755859375, 4.23773193359375, 4.4757080078125, 4.71368408203125, 4.95166015625, 5.18963623046875, 5.4276123046875, 5.66558837890625, 5.903564453125, 6.14154052734375, 6.3795166015625, 6.61749267578125, 6.85546875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 19.0, 23.0, 34.0, 42.0, 89.0, 112.0, 286.0, 581.0, 1468.0, 4606.0, 22773.0, 235000.0, 3626288.0, 270127.0, 24990.0, 5031.0, 1517.0, 568.0, 276.0, 159.0, 70.0, 56.0, 37.0, 22.0, 21.0, 9.0, 11.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0], "bins": [-13.1015625, -12.79345703125, -12.4853515625, -12.17724609375, -11.869140625, -11.56103515625, -11.2529296875, -10.94482421875, -10.63671875, -10.32861328125, -10.0205078125, -9.71240234375, -9.404296875, -9.09619140625, -8.7880859375, -8.47998046875, -8.171875, -7.86376953125, -7.5556640625, -7.24755859375, -6.939453125, -6.63134765625, -6.3232421875, -6.01513671875, -5.70703125, -5.39892578125, -5.0908203125, -4.78271484375, -4.474609375, -4.16650390625, -3.8583984375, -3.55029296875, -3.2421875, -2.93408203125, -2.6259765625, -2.31787109375, -2.009765625, -1.70166015625, -1.3935546875, -1.08544921875, -0.77734375, -0.46923828125, -0.1611328125, 0.14697265625, 0.455078125, 0.76318359375, 1.0712890625, 1.37939453125, 1.6875, 1.99560546875, 2.3037109375, 2.61181640625, 2.919921875, 3.22802734375, 3.5361328125, 3.84423828125, 4.15234375, 4.46044921875, 4.7685546875, 5.07666015625, 5.384765625, 5.69287109375, 6.0009765625, 6.30908203125, 6.6171875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 3.0, 7.0, 9.0, 16.0, 19.0, 29.0, 27.0, 50.0, 59.0, 92.0, 147.0, 249.0, 393.0, 591.0, 688.0, 580.0, 363.0, 247.0, 135.0, 113.0, 59.0, 59.0, 41.0, 25.0, 20.0, 11.0, 12.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.7808990478515625, -1.711212158203125, -1.6415252685546875, -1.57183837890625, -1.5021514892578125, -1.432464599609375, -1.3627777099609375, -1.2930908203125, -1.2234039306640625, -1.153717041015625, -1.0840301513671875, -1.01434326171875, -0.9446563720703125, -0.874969482421875, -0.8052825927734375, -0.735595703125, -0.6659088134765625, -0.596221923828125, -0.5265350341796875, -0.45684814453125, -0.3871612548828125, -0.317474365234375, -0.2477874755859375, -0.1781005859375, -0.1084136962890625, -0.038726806640625, 0.0309600830078125, 0.10064697265625, 0.1703338623046875, 0.240020751953125, 0.3097076416015625, 0.37939453125, 0.4490814208984375, 0.518768310546875, 0.5884552001953125, 0.65814208984375, 0.7278289794921875, 0.797515869140625, 0.8672027587890625, 0.9368896484375, 1.0065765380859375, 1.076263427734375, 1.1459503173828125, 1.21563720703125, 1.2853240966796875, 1.355010986328125, 1.4246978759765625, 1.494384765625, 1.5640716552734375, 1.633758544921875, 1.7034454345703125, 1.77313232421875, 1.8428192138671875, 1.912506103515625, 1.9821929931640625, 2.0518798828125, 2.1215667724609375, 2.191253662109375, 2.2609405517578125, 2.33062744140625, 2.4003143310546875, 2.470001220703125, 2.5396881103515625, 2.609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 14.0, 23.0, 31.0, 95.0, 147.0, 196.0, 217.0, 129.0, 74.0, 26.0, 21.0, 12.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.957261085510254, -6.37431001663208, -5.7913594245910645, -5.208408355712891, -4.625457763671875, -4.042506694793701, -3.4595556259155273, -2.8766050338745117, -2.293653964996338, -1.7107031345367432, -1.1277521848678589, -0.5448012351989746, 0.03814959526062012, 0.6211004257202148, 1.2040514945983887, 1.7870020866394043, 2.369953155517578, 2.952903985977173, 3.5358548164367676, 4.118805885314941, 4.701756477355957, 5.284707546234131, 5.867658615112305, 6.45060920715332, 7.033560276031494, 7.616511344909668, 8.199461936950684, 8.782413482666016, 9.365364074707031, 9.948314666748047, 10.531265258789062, 11.114215850830078, 11.697168350219727, 12.280118942260742, 12.863070487976074, 13.44602108001709, 14.028971672058105, 14.611923217773438, 15.194873809814453, 15.777824401855469, 16.360774993896484, 16.9437255859375, 17.526676177978516, 18.10962677001953, 18.69257926940918, 19.275529861450195, 19.85848045349121, 20.441431045532227, 21.024383544921875, 21.60733413696289, 22.190284729003906, 22.773235321044922, 23.35618782043457, 23.939138412475586, 24.5220890045166, 25.105039596557617, 25.687990188598633, 26.27094078063965, 26.853891372680664, 27.436843872070312, 28.019794464111328, 28.602745056152344, 29.18569564819336, 29.768646240234375, 30.35159683227539]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 17.0, 28.0, 20.0, 41.0, 47.0, 55.0, 66.0, 79.0, 86.0, 82.0, 69.0, 76.0, 57.0, 58.0, 45.0, 32.0, 37.0, 19.0, 18.0, 14.0, 9.0, 11.0, 8.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.815110206604004, -9.547473907470703, -9.279837608337402, -9.012201309204102, -8.744564056396484, -8.476927757263184, -8.209291458129883, -7.941655158996582, -7.674018859863281, -7.4063825607299805, -7.1387457847595215, -6.871109485626221, -6.60347318649292, -6.335836410522461, -6.06820011138916, -5.800563812255859, -5.5329270362854, -5.2652907371521, -4.997653961181641, -4.73001766204834, -4.462381362915039, -4.194745063781738, -3.9271082878112793, -3.6594719886779785, -3.3918354511260986, -3.1241989135742188, -2.856562614440918, -2.588926076889038, -2.321289539337158, -2.0536532402038574, -1.7860167026519775, -1.5183802843093872, -1.2507438659667969, -0.9831074476242065, -0.7154709696769714, -0.44783449172973633, -0.180198073387146, 0.08743834495544434, 0.3550748825073242, 0.6227113008499146, 0.8903477191925049, 1.1579841375350952, 1.4256205558776855, 1.6932570934295654, 1.9608935117721558, 2.228529930114746, 2.496166467666626, 2.763803005218506, 3.0314393043518066, 3.2990758419036865, 3.5667121410369873, 3.834348678588867, 4.101984977722168, 4.369621276855469, 4.637258052825928, 4.9048943519592285, 5.1725311279296875, 5.440167427062988, 5.707804203033447, 5.975440502166748, 6.243076801300049, 6.510713577270508, 6.778349876403809, 7.045986175537109, 7.31362247467041]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 14.0, 17.0, 26.0, 35.0, 76.0, 149.0, 317.0, 612.0, 1350.0, 3429.0, 9776.0, 33207.0, 153376.0, 555861.0, 225012.0, 45063.0, 12692.0, 4380.0, 1703.0, 745.0, 320.0, 141.0, 94.0, 49.0, 34.0, 22.0, 8.0, 10.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9298858642578125, -1.872467041015625, -1.8150482177734375, -1.75762939453125, -1.7002105712890625, -1.642791748046875, -1.5853729248046875, -1.5279541015625, -1.4705352783203125, -1.413116455078125, -1.3556976318359375, -1.29827880859375, -1.2408599853515625, -1.183441162109375, -1.1260223388671875, -1.068603515625, -1.0111846923828125, -0.953765869140625, -0.8963470458984375, -0.83892822265625, -0.7815093994140625, -0.724090576171875, -0.6666717529296875, -0.6092529296875, -0.5518341064453125, -0.494415283203125, -0.4369964599609375, -0.37957763671875, -0.3221588134765625, -0.264739990234375, -0.2073211669921875, -0.14990234375, -0.0924835205078125, -0.035064697265625, 0.0223541259765625, 0.07977294921875, 0.1371917724609375, 0.194610595703125, 0.2520294189453125, 0.3094482421875, 0.3668670654296875, 0.424285888671875, 0.4817047119140625, 0.53912353515625, 0.5965423583984375, 0.653961181640625, 0.7113800048828125, 0.768798828125, 0.8262176513671875, 0.883636474609375, 0.9410552978515625, 0.99847412109375, 1.0558929443359375, 1.113311767578125, 1.1707305908203125, 1.2281494140625, 1.2855682373046875, 1.342987060546875, 1.4004058837890625, 1.45782470703125, 1.5152435302734375, 1.572662353515625, 1.6300811767578125, 1.6875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 7.0, 5.0, 7.0, 8.0, 16.0, 22.0, 28.0, 38.0, 40.0, 59.0, 73.0, 82.0, 78.0, 73.0, 71.0, 83.0, 58.0, 62.0, 46.0, 26.0, 27.0, 19.0, 19.0, 14.0, 8.0, 12.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.83203125, -5.6678466796875, -5.503662109375, -5.3394775390625, -5.17529296875, -5.0111083984375, -4.846923828125, -4.6827392578125, -4.5185546875, -4.3543701171875, -4.190185546875, -4.0260009765625, -3.86181640625, -3.6976318359375, -3.533447265625, -3.3692626953125, -3.205078125, -3.0408935546875, -2.876708984375, -2.7125244140625, -2.54833984375, -2.3841552734375, -2.219970703125, -2.0557861328125, -1.8916015625, -1.7274169921875, -1.563232421875, -1.3990478515625, -1.23486328125, -1.0706787109375, -0.906494140625, -0.7423095703125, -0.578125, -0.4139404296875, -0.249755859375, -0.0855712890625, 0.07861328125, 0.2427978515625, 0.406982421875, 0.5711669921875, 0.7353515625, 0.8995361328125, 1.063720703125, 1.2279052734375, 1.39208984375, 1.5562744140625, 1.720458984375, 1.8846435546875, 2.048828125, 2.2130126953125, 2.377197265625, 2.5413818359375, 2.70556640625, 2.8697509765625, 3.033935546875, 3.1981201171875, 3.3623046875, 3.5264892578125, 3.690673828125, 3.8548583984375, 4.01904296875, 4.1832275390625, 4.347412109375, 4.5115966796875, 4.67578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 13.0, 12.0, 14.0, 23.0, 14.0, 48.0, 51.0, 92.0, 95.0, 179.0, 275.0, 474.0, 815.0, 1487.0, 2906.0, 6127.0, 14327.0, 36377.0, 109493.0, 342788.0, 353051.0, 114361.0, 37917.0, 14656.0, 6304.0, 2960.0, 1518.0, 815.0, 506.0, 303.0, 176.0, 101.0, 70.0, 50.0, 34.0, 25.0, 27.0, 13.0, 8.0, 6.0, 13.0, 7.0, 4.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2919921875, -1.2528533935546875, -1.213714599609375, -1.1745758056640625, -1.13543701171875, -1.0962982177734375, -1.057159423828125, -1.0180206298828125, -0.9788818359375, -0.9397430419921875, -0.900604248046875, -0.8614654541015625, -0.82232666015625, -0.7831878662109375, -0.744049072265625, -0.7049102783203125, -0.665771484375, -0.6266326904296875, -0.587493896484375, -0.5483551025390625, -0.50921630859375, -0.4700775146484375, -0.430938720703125, -0.3917999267578125, -0.3526611328125, -0.3135223388671875, -0.274383544921875, -0.2352447509765625, -0.19610595703125, -0.1569671630859375, -0.117828369140625, -0.0786895751953125, -0.03955078125, -0.0004119873046875, 0.038726806640625, 0.0778656005859375, 0.11700439453125, 0.1561431884765625, 0.195281982421875, 0.2344207763671875, 0.2735595703125, 0.3126983642578125, 0.351837158203125, 0.3909759521484375, 0.43011474609375, 0.4692535400390625, 0.508392333984375, 0.5475311279296875, 0.586669921875, 0.6258087158203125, 0.664947509765625, 0.7040863037109375, 0.74322509765625, 0.7823638916015625, 0.821502685546875, 0.8606414794921875, 0.8997802734375, 0.9389190673828125, 0.978057861328125, 1.0171966552734375, 1.05633544921875, 1.0954742431640625, 1.134613037109375, 1.1737518310546875, 1.212890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 8.0, 8.0, 10.0, 16.0, 23.0, 20.0, 19.0, 29.0, 40.0, 27.0, 19.0, 35.0, 43.0, 50.0, 58.0, 53.0, 54.0, 48.0, 51.0, 34.0, 53.0, 43.0, 32.0, 32.0, 27.0, 33.0, 29.0, 14.0, 21.0, 11.0, 7.0, 10.0, 3.0, 13.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.2421875, -7.0162353515625, -6.790283203125, -6.5643310546875, -6.33837890625, -6.1124267578125, -5.886474609375, -5.6605224609375, -5.4345703125, -5.2086181640625, -4.982666015625, -4.7567138671875, -4.53076171875, -4.3048095703125, -4.078857421875, -3.8529052734375, -3.626953125, -3.4010009765625, -3.175048828125, -2.9490966796875, -2.72314453125, -2.4971923828125, -2.271240234375, -2.0452880859375, -1.8193359375, -1.5933837890625, -1.367431640625, -1.1414794921875, -0.91552734375, -0.6895751953125, -0.463623046875, -0.2376708984375, -0.01171875, 0.2142333984375, 0.440185546875, 0.6661376953125, 0.89208984375, 1.1180419921875, 1.343994140625, 1.5699462890625, 1.7958984375, 2.0218505859375, 2.247802734375, 2.4737548828125, 2.69970703125, 2.9256591796875, 3.151611328125, 3.3775634765625, 3.603515625, 3.8294677734375, 4.055419921875, 4.2813720703125, 4.50732421875, 4.7332763671875, 4.959228515625, 5.1851806640625, 5.4111328125, 5.6370849609375, 5.863037109375, 6.0889892578125, 6.31494140625, 6.5408935546875, 6.766845703125, 6.9927978515625, 7.21875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 8.0, 13.0, 20.0, 19.0, 32.0, 49.0, 64.0, 85.0, 138.0, 254.0, 426.0, 922.0, 2030.0, 4959.0, 14855.0, 55744.0, 275244.0, 534131.0, 117098.0, 28111.0, 8440.0, 3082.0, 1279.0, 633.0, 355.0, 156.0, 110.0, 86.0, 57.0, 35.0, 22.0, 23.0, 15.0, 4.0, 7.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.69970703125, -0.6773147583007812, -0.6549224853515625, -0.6325302124023438, -0.610137939453125, -0.5877456665039062, -0.5653533935546875, -0.5429611206054688, -0.52056884765625, -0.49817657470703125, -0.4757843017578125, -0.45339202880859375, -0.430999755859375, -0.40860748291015625, -0.3862152099609375, -0.36382293701171875, -0.3414306640625, -0.31903839111328125, -0.2966461181640625, -0.27425384521484375, -0.251861572265625, -0.22946929931640625, -0.2070770263671875, -0.18468475341796875, -0.16229248046875, -0.13990020751953125, -0.1175079345703125, -0.09511566162109375, -0.072723388671875, -0.05033111572265625, -0.0279388427734375, -0.00554656982421875, 0.016845703125, 0.03923797607421875, 0.0616302490234375, 0.08402252197265625, 0.106414794921875, 0.12880706787109375, 0.1511993408203125, 0.17359161376953125, 0.19598388671875, 0.21837615966796875, 0.2407684326171875, 0.26316070556640625, 0.285552978515625, 0.30794525146484375, 0.3303375244140625, 0.35272979736328125, 0.3751220703125, 0.39751434326171875, 0.4199066162109375, 0.44229888916015625, 0.464691162109375, 0.48708343505859375, 0.5094757080078125, 0.5318679809570312, 0.55426025390625, 0.5766525268554688, 0.5990447998046875, 0.6214370727539062, 0.643829345703125, 0.6662216186523438, 0.6886138916015625, 0.7110061645507812, 0.7333984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 9.0, 11.0, 9.0, 15.0, 16.0, 19.0, 29.0, 31.0, 43.0, 71.0, 91.0, 89.0, 114.0, 93.0, 78.0, 70.0, 60.0, 45.0, 27.0, 11.0, 20.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002536773681640625, -0.00024364516139030457, -0.00023361295461654663, -0.0002235807478427887, -0.00021354854106903076, -0.00020351633429527283, -0.0001934841275215149, -0.00018345192074775696, -0.00017341971397399902, -0.0001633875072002411, -0.00015335530042648315, -0.00014332309365272522, -0.00013329088687896729, -0.00012325868010520935, -0.00011322647333145142, -0.00010319426655769348, -9.316205978393555e-05, -8.312985301017761e-05, -7.309764623641968e-05, -6.306543946266174e-05, -5.303323268890381e-05, -4.3001025915145874e-05, -3.296881914138794e-05, -2.2936612367630005e-05, -1.290440559387207e-05, -2.8721988201141357e-06, 7.160007953643799e-06, 1.7192214727401733e-05, 2.7224421501159668e-05, 3.72566282749176e-05, 4.728883504867554e-05, 5.732104182243347e-05, 6.73532485961914e-05, 7.738545536994934e-05, 8.741766214370728e-05, 9.744986891746521e-05, 0.00010748207569122314, 0.00011751428246498108, 0.00012754648923873901, 0.00013757869601249695, 0.00014761090278625488, 0.00015764310956001282, 0.00016767531633377075, 0.0001777075231075287, 0.00018773972988128662, 0.00019777193665504456, 0.0002078041434288025, 0.00021783635020256042, 0.00022786855697631836, 0.0002379007637500763, 0.00024793297052383423, 0.00025796517729759216, 0.0002679973840713501, 0.00027802959084510803, 0.00028806179761886597, 0.0002980940043926239, 0.00030812621116638184, 0.00031815841794013977, 0.0003281906247138977, 0.00033822283148765564, 0.0003482550382614136, 0.0003582872450351715, 0.00036831945180892944, 0.0003783516585826874, 0.0003883838653564453]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 13.0, 10.0, 7.0, 10.0, 17.0, 22.0, 25.0, 60.0, 88.0, 107.0, 199.0, 377.0, 735.0, 1535.0, 3965.0, 11700.0, 41051.0, 172096.0, 537301.0, 209036.0, 48591.0, 13495.0, 4530.0, 1746.0, 779.0, 388.0, 256.0, 153.0, 90.0, 48.0, 30.0, 15.0, 15.0, 14.0, 6.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.69482421875, -0.6747207641601562, -0.6546173095703125, -0.6345138549804688, -0.614410400390625, -0.5943069458007812, -0.5742034912109375, -0.5541000366210938, -0.53399658203125, -0.5138931274414062, -0.4937896728515625, -0.47368621826171875, -0.453582763671875, -0.43347930908203125, -0.4133758544921875, -0.39327239990234375, -0.3731689453125, -0.35306549072265625, -0.3329620361328125, -0.31285858154296875, -0.292755126953125, -0.27265167236328125, -0.2525482177734375, -0.23244476318359375, -0.21234130859375, -0.19223785400390625, -0.1721343994140625, -0.15203094482421875, -0.131927490234375, -0.11182403564453125, -0.0917205810546875, -0.07161712646484375, -0.051513671875, -0.03141021728515625, -0.0113067626953125, 0.00879669189453125, 0.028900146484375, 0.04900360107421875, 0.0691070556640625, 0.08921051025390625, 0.10931396484375, 0.12941741943359375, 0.1495208740234375, 0.16962432861328125, 0.189727783203125, 0.20983123779296875, 0.2299346923828125, 0.25003814697265625, 0.2701416015625, 0.29024505615234375, 0.3103485107421875, 0.33045196533203125, 0.350555419921875, 0.37065887451171875, 0.3907623291015625, 0.41086578369140625, 0.43096923828125, 0.45107269287109375, 0.4711761474609375, 0.49127960205078125, 0.511383056640625, 0.5314865112304688, 0.5515899658203125, 0.5716934204101562, 0.591796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 14.0, 12.0, 15.0, 17.0, 26.0, 30.0, 36.0, 31.0, 44.0, 51.0, 55.0, 80.0, 65.0, 90.0, 67.0, 57.0, 50.0, 43.0, 40.0, 27.0, 17.0, 20.0, 17.0, 15.0, 10.0, 10.0, 6.0, 4.0, 8.0, 7.0, 2.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13055419921875, -0.12646484375, -0.12237548828125, -0.1182861328125, -0.11419677734375, -0.110107421875, -0.10601806640625, -0.1019287109375, -0.09783935546875, -0.09375, -0.08966064453125, -0.0855712890625, -0.08148193359375, -0.077392578125, -0.07330322265625, -0.0692138671875, -0.06512451171875, -0.06103515625, -0.05694580078125, -0.0528564453125, -0.04876708984375, -0.044677734375, -0.04058837890625, -0.0364990234375, -0.03240966796875, -0.0283203125, -0.02423095703125, -0.0201416015625, -0.01605224609375, -0.011962890625, -0.00787353515625, -0.0037841796875, 0.00030517578125, 0.00439453125, 0.00848388671875, 0.0125732421875, 0.01666259765625, 0.020751953125, 0.02484130859375, 0.0289306640625, 0.03302001953125, 0.037109375, 0.04119873046875, 0.0452880859375, 0.04937744140625, 0.053466796875, 0.05755615234375, 0.0616455078125, 0.06573486328125, 0.06982421875, 0.07391357421875, 0.0780029296875, 0.08209228515625, 0.086181640625, 0.09027099609375, 0.0943603515625, 0.09844970703125, 0.1025390625, 0.10662841796875, 0.1107177734375, 0.11480712890625, 0.118896484375, 0.12298583984375, 0.1270751953125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 15.0, 35.0, 107.0, 206.0, 305.0, 174.0, 88.0, 32.0, 17.0, 11.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.790182113647461, -5.328359127044678, -4.866536617279053, -4.4047136306762695, -3.9428911209106445, -3.4810681343078613, -3.0192453861236572, -2.557422637939453, -2.095599889755249, -1.633777141571045, -1.1719543933868408, -0.7101315259933472, -0.24830877780914307, 0.21351408958435059, 0.6753368377685547, 1.1371595859527588, 1.598982334136963, 2.060805082321167, 2.522627830505371, 2.9844508171081543, 3.4462733268737793, 3.9080963134765625, 4.3699188232421875, 4.831741809844971, 5.293564796447754, 5.755387783050537, 6.217210292816162, 6.679033279418945, 7.14085578918457, 7.6026787757873535, 8.064501762390137, 8.526324272155762, 8.988146781921387, 9.449969291687012, 9.911792755126953, 10.373615264892578, 10.835437774658203, 11.297260284423828, 11.75908374786377, 12.220906257629395, 12.68272876739502, 13.144551277160645, 13.606374740600586, 14.068197250366211, 14.530019760131836, 14.991842269897461, 15.453665733337402, 15.915488243103027, 16.37731170654297, 16.839134216308594, 17.30095672607422, 17.762779235839844, 18.2246036529541, 18.686426162719727, 19.14824867248535, 19.610071182250977, 20.0718936920166, 20.533716201782227, 20.99553871154785, 21.457361221313477, 21.919185638427734, 22.38100814819336, 22.842830657958984, 23.30465316772461, 23.766475677490234]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 8.0, 4.0, 14.0, 14.0, 26.0, 32.0, 42.0, 51.0, 49.0, 92.0, 92.0, 84.0, 93.0, 74.0, 70.0, 61.0, 45.0, 37.0, 28.0, 32.0, 17.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.942391872406006, -5.76731538772583, -5.592238426208496, -5.41716194152832, -5.2420854568481445, -5.067008972167969, -4.891932010650635, -4.716855525970459, -4.541778564453125, -4.366702079772949, -4.191625118255615, -4.0165486335754395, -3.8414721488952637, -3.666395425796509, -3.491318702697754, -3.316242218017578, -3.1411657333374023, -2.9660890102386475, -2.7910125255584717, -2.615935802459717, -2.440859317779541, -2.265782594680786, -2.0907058715820312, -1.915629267692566, -1.7405526638031006, -1.5654760599136353, -1.39039945602417, -1.215322732925415, -1.0402461290359497, -0.8651695251464844, -0.6900928020477295, -0.5150161981582642, -0.3399391174316406, -0.1648624837398529, 0.010214149951934814, 0.18529081344604492, 0.36036741733551025, 0.5354440212249756, 0.7105207443237305, 0.8855973482131958, 1.0606739521026611, 1.2357505559921265, 1.4108271598815918, 1.5859038829803467, 1.760980486869812, 1.9360570907592773, 2.1111338138580322, 2.286210536956787, 2.461287021636963, 2.6363637447357178, 2.8114402294158936, 2.9865169525146484, 3.161593437194824, 3.336670160293579, 3.511746883392334, 3.6868233680725098, 3.8619000911712646, 4.0369768142700195, 4.212053298950195, 4.387129783630371, 4.562206745147705, 4.737283229827881, 4.912360191345215, 5.087436676025391, 5.262513160705566]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 7.0, 4.0, 8.0, 8.0, 11.0, 32.0, 32.0, 53.0, 89.0, 147.0, 250.0, 425.0, 803.0, 1567.0, 3432.0, 8851.0, 29017.0, 147637.0, 629087.0, 176607.0, 33114.0, 9974.0, 3749.0, 1705.0, 864.0, 446.0, 251.0, 148.0, 90.0, 58.0, 27.0, 27.0, 18.0, 6.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6484375, -4.517669677734375, -4.38690185546875, -4.256134033203125, -4.1253662109375, -3.994598388671875, -3.86383056640625, -3.733062744140625, -3.602294921875, -3.471527099609375, -3.34075927734375, -3.209991455078125, -3.0792236328125, -2.948455810546875, -2.81768798828125, -2.686920166015625, -2.55615234375, -2.425384521484375, -2.29461669921875, -2.163848876953125, -2.0330810546875, -1.902313232421875, -1.77154541015625, -1.640777587890625, -1.510009765625, -1.379241943359375, -1.24847412109375, -1.117706298828125, -0.9869384765625, -0.856170654296875, -0.72540283203125, -0.594635009765625, -0.4638671875, -0.333099365234375, -0.20233154296875, -0.071563720703125, 0.0592041015625, 0.189971923828125, 0.32073974609375, 0.451507568359375, 0.582275390625, 0.713043212890625, 0.84381103515625, 0.974578857421875, 1.1053466796875, 1.236114501953125, 1.36688232421875, 1.497650146484375, 1.62841796875, 1.759185791015625, 1.88995361328125, 2.020721435546875, 2.1514892578125, 2.282257080078125, 2.41302490234375, 2.543792724609375, 2.674560546875, 2.805328369140625, 2.93609619140625, 3.066864013671875, 3.1976318359375, 3.328399658203125, 3.45916748046875, 3.589935302734375, 3.720703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 19.0, 20.0, 30.0, 41.0, 42.0, 62.0, 80.0, 80.0, 97.0, 99.0, 76.0, 70.0, 61.0, 43.0, 38.0, 29.0, 34.0, 24.0, 7.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.546875, -15.117919921875, -14.68896484375, -14.260009765625, -13.8310546875, -13.402099609375, -12.97314453125, -12.544189453125, -12.115234375, -11.686279296875, -11.25732421875, -10.828369140625, -10.3994140625, -9.970458984375, -9.54150390625, -9.112548828125, -8.68359375, -8.254638671875, -7.82568359375, -7.396728515625, -6.9677734375, -6.538818359375, -6.10986328125, -5.680908203125, -5.251953125, -4.822998046875, -4.39404296875, -3.965087890625, -3.5361328125, -3.107177734375, -2.67822265625, -2.249267578125, -1.8203125, -1.391357421875, -0.96240234375, -0.533447265625, -0.1044921875, 0.324462890625, 0.75341796875, 1.182373046875, 1.611328125, 2.040283203125, 2.46923828125, 2.898193359375, 3.3271484375, 3.756103515625, 4.18505859375, 4.614013671875, 5.04296875, 5.471923828125, 5.90087890625, 6.329833984375, 6.7587890625, 7.187744140625, 7.61669921875, 8.045654296875, 8.474609375, 8.903564453125, 9.33251953125, 9.761474609375, 10.1904296875, 10.619384765625, 11.04833984375, 11.477294921875, 11.90625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 10.0, 13.0, 24.0, 40.0, 33.0, 63.0, 68.0, 102.0, 117.0, 229.0, 459.0, 1027.0, 3240.0, 14592.0, 137748.0, 775267.0, 98878.0, 11794.0, 2783.0, 940.0, 418.0, 190.0, 134.0, 88.0, 66.0, 43.0, 46.0, 24.0, 28.0, 16.0, 13.0, 8.0, 6.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.32513427734375, -5.1658935546875, -5.00665283203125, -4.847412109375, -4.68817138671875, -4.5289306640625, -4.36968994140625, -4.21044921875, -4.05120849609375, -3.8919677734375, -3.73272705078125, -3.573486328125, -3.41424560546875, -3.2550048828125, -3.09576416015625, -2.9365234375, -2.77728271484375, -2.6180419921875, -2.45880126953125, -2.299560546875, -2.14031982421875, -1.9810791015625, -1.82183837890625, -1.66259765625, -1.50335693359375, -1.3441162109375, -1.18487548828125, -1.025634765625, -0.86639404296875, -0.7071533203125, -0.54791259765625, -0.388671875, -0.22943115234375, -0.0701904296875, 0.08905029296875, 0.248291015625, 0.40753173828125, 0.5667724609375, 0.72601318359375, 0.88525390625, 1.04449462890625, 1.2037353515625, 1.36297607421875, 1.522216796875, 1.68145751953125, 1.8406982421875, 1.99993896484375, 2.1591796875, 2.31842041015625, 2.4776611328125, 2.63690185546875, 2.796142578125, 2.95538330078125, 3.1146240234375, 3.27386474609375, 3.43310546875, 3.59234619140625, 3.7515869140625, 3.91082763671875, 4.070068359375, 4.22930908203125, 4.3885498046875, 4.54779052734375, 4.70703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 4.0, 3.0, 9.0, 10.0, 21.0, 25.0, 24.0, 20.0, 31.0, 38.0, 43.0, 40.0, 52.0, 57.0, 54.0, 51.0, 44.0, 70.0, 48.0, 39.0, 45.0, 51.0, 34.0, 32.0, 28.0, 24.0, 29.0, 13.0, 16.0, 12.0, 5.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.383544921875, -10.02490234375, -9.666259765625, -9.3076171875, -8.948974609375, -8.59033203125, -8.231689453125, -7.873046875, -7.514404296875, -7.15576171875, -6.797119140625, -6.4384765625, -6.079833984375, -5.72119140625, -5.362548828125, -5.00390625, -4.645263671875, -4.28662109375, -3.927978515625, -3.5693359375, -3.210693359375, -2.85205078125, -2.493408203125, -2.134765625, -1.776123046875, -1.41748046875, -1.058837890625, -0.7001953125, -0.341552734375, 0.01708984375, 0.375732421875, 0.734375, 1.093017578125, 1.45166015625, 1.810302734375, 2.1689453125, 2.527587890625, 2.88623046875, 3.244873046875, 3.603515625, 3.962158203125, 4.32080078125, 4.679443359375, 5.0380859375, 5.396728515625, 5.75537109375, 6.114013671875, 6.47265625, 6.831298828125, 7.18994140625, 7.548583984375, 7.9072265625, 8.265869140625, 8.62451171875, 8.983154296875, 9.341796875, 9.700439453125, 10.05908203125, 10.417724609375, 10.7763671875, 11.135009765625, 11.49365234375, 11.852294921875, 12.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 11.0, 5.0, 21.0, 20.0, 40.0, 54.0, 92.0, 132.0, 252.0, 503.0, 1041.0, 2455.0, 7247.0, 31399.0, 197328.0, 652133.0, 124641.0, 21541.0, 5567.0, 2023.0, 889.0, 461.0, 240.0, 137.0, 94.0, 63.0, 47.0, 16.0, 19.0, 17.0, 6.0, 8.0, 2.0, 3.0, 2.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1845703125, -1.1428375244140625, -1.101104736328125, -1.0593719482421875, -1.01763916015625, -0.9759063720703125, -0.934173583984375, -0.8924407958984375, -0.8507080078125, -0.8089752197265625, -0.767242431640625, -0.7255096435546875, -0.68377685546875, -0.6420440673828125, -0.600311279296875, -0.5585784912109375, -0.516845703125, -0.4751129150390625, -0.433380126953125, -0.3916473388671875, -0.34991455078125, -0.3081817626953125, -0.266448974609375, -0.2247161865234375, -0.1829833984375, -0.1412506103515625, -0.099517822265625, -0.0577850341796875, -0.01605224609375, 0.0256805419921875, 0.067413330078125, 0.1091461181640625, 0.15087890625, 0.1926116943359375, 0.234344482421875, 0.2760772705078125, 0.31781005859375, 0.3595428466796875, 0.401275634765625, 0.4430084228515625, 0.4847412109375, 0.5264739990234375, 0.568206787109375, 0.6099395751953125, 0.65167236328125, 0.6934051513671875, 0.735137939453125, 0.7768707275390625, 0.818603515625, 0.8603363037109375, 0.902069091796875, 0.9438018798828125, 0.98553466796875, 1.0272674560546875, 1.069000244140625, 1.1107330322265625, 1.1524658203125, 1.1941986083984375, 1.235931396484375, 1.2776641845703125, 1.31939697265625, 1.3611297607421875, 1.402862548828125, 1.4445953369140625, 1.486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 12.0, 15.0, 14.0, 37.0, 39.0, 49.0, 66.0, 97.0, 117.0, 123.0, 88.0, 75.0, 59.0, 43.0, 38.0, 38.0, 13.0, 16.0, 10.0, 4.0, 5.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002123117446899414, -0.00020629167556762695, -0.0002002716064453125, -0.00019425153732299805, -0.0001882314682006836, -0.00018221139907836914, -0.0001761913299560547, -0.00017017126083374023, -0.00016415119171142578, -0.00015813112258911133, -0.00015211105346679688, -0.00014609098434448242, -0.00014007091522216797, -0.00013405084609985352, -0.00012803077697753906, -0.00012201070785522461, -0.00011599063873291016, -0.0001099705696105957, -0.00010395050048828125, -9.79304313659668e-05, -9.191036224365234e-05, -8.589029312133789e-05, -7.987022399902344e-05, -7.385015487670898e-05, -6.783008575439453e-05, -6.181001663208008e-05, -5.5789947509765625e-05, -4.976987838745117e-05, -4.374980926513672e-05, -3.7729740142822266e-05, -3.170967102050781e-05, -2.568960189819336e-05, -1.9669532775878906e-05, -1.3649463653564453e-05, -7.62939453125e-06, -1.6093254089355469e-06, 4.410743713378906e-06, 1.043081283569336e-05, 1.6450881958007812e-05, 2.2470951080322266e-05, 2.849102020263672e-05, 3.451108932495117e-05, 4.0531158447265625e-05, 4.655122756958008e-05, 5.257129669189453e-05, 5.8591365814208984e-05, 6.461143493652344e-05, 7.063150405883789e-05, 7.665157318115234e-05, 8.26716423034668e-05, 8.869171142578125e-05, 9.47117805480957e-05, 0.00010073184967041016, 0.00010675191879272461, 0.00011277198791503906, 0.00011879205703735352, 0.00012481212615966797, 0.00013083219528198242, 0.00013685226440429688, 0.00014287233352661133, 0.00014889240264892578, 0.00015491247177124023, 0.0001609325408935547, 0.00016695261001586914, 0.0001729726791381836]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 12.0, 25.0, 22.0, 36.0, 51.0, 67.0, 126.0, 191.0, 332.0, 604.0, 1243.0, 2655.0, 6156.0, 17062.0, 59246.0, 275438.0, 529469.0, 110626.0, 28248.0, 9400.0, 3878.0, 1743.0, 830.0, 402.0, 211.0, 146.0, 88.0, 62.0, 40.0, 29.0, 26.0, 14.0, 15.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.16015625, -1.1252288818359375, -1.090301513671875, -1.0553741455078125, -1.02044677734375, -0.9855194091796875, -0.950592041015625, -0.9156646728515625, -0.8807373046875, -0.8458099365234375, -0.810882568359375, -0.7759552001953125, -0.74102783203125, -0.7061004638671875, -0.671173095703125, -0.6362457275390625, -0.601318359375, -0.5663909912109375, -0.531463623046875, -0.4965362548828125, -0.46160888671875, -0.4266815185546875, -0.391754150390625, -0.3568267822265625, -0.3218994140625, -0.2869720458984375, -0.252044677734375, -0.2171173095703125, -0.18218994140625, -0.1472625732421875, -0.112335205078125, -0.0774078369140625, -0.04248046875, -0.0075531005859375, 0.027374267578125, 0.0623016357421875, 0.09722900390625, 0.1321563720703125, 0.167083740234375, 0.2020111083984375, 0.2369384765625, 0.2718658447265625, 0.306793212890625, 0.3417205810546875, 0.37664794921875, 0.4115753173828125, 0.446502685546875, 0.4814300537109375, 0.516357421875, 0.5512847900390625, 0.586212158203125, 0.6211395263671875, 0.65606689453125, 0.6909942626953125, 0.725921630859375, 0.7608489990234375, 0.7957763671875, 0.8307037353515625, 0.865631103515625, 0.9005584716796875, 0.93548583984375, 0.9704132080078125, 1.005340576171875, 1.0402679443359375, 1.0751953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 5.0, 3.0, 8.0, 10.0, 6.0, 11.0, 14.0, 12.0, 25.0, 33.0, 30.0, 35.0, 37.0, 49.0, 50.0, 77.0, 89.0, 90.0, 70.0, 68.0, 54.0, 31.0, 30.0, 24.0, 21.0, 17.0, 18.0, 20.0, 11.0, 7.0, 3.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.537109375, -0.5192642211914062, -0.5014190673828125, -0.48357391357421875, -0.465728759765625, -0.44788360595703125, -0.4300384521484375, -0.41219329833984375, -0.39434814453125, -0.37650299072265625, -0.3586578369140625, -0.34081268310546875, -0.322967529296875, -0.30512237548828125, -0.2872772216796875, -0.26943206787109375, -0.2515869140625, -0.23374176025390625, -0.2158966064453125, -0.19805145263671875, -0.180206298828125, -0.16236114501953125, -0.1445159912109375, -0.12667083740234375, -0.10882568359375, -0.09098052978515625, -0.0731353759765625, -0.05529022216796875, -0.037445068359375, -0.01959991455078125, -0.0017547607421875, 0.01609039306640625, 0.033935546875, 0.05178070068359375, 0.0696258544921875, 0.08747100830078125, 0.105316162109375, 0.12316131591796875, 0.1410064697265625, 0.15885162353515625, 0.17669677734375, 0.19454193115234375, 0.2123870849609375, 0.23023223876953125, 0.248077392578125, 0.26592254638671875, 0.2837677001953125, 0.30161285400390625, 0.3194580078125, 0.33730316162109375, 0.3551483154296875, 0.37299346923828125, 0.390838623046875, 0.40868377685546875, 0.4265289306640625, 0.44437408447265625, 0.46221923828125, 0.48006439208984375, 0.4979095458984375, 0.5157546997070312, 0.533599853515625, 0.5514450073242188, 0.5692901611328125, 0.5871353149414062, 0.60498046875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 36.0, 95.0, 299.0, 361.0, 134.0, 41.0, 18.0, 8.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.893125534057617, -22.651193618774414, -21.409259796142578, -20.167327880859375, -18.925395965576172, -17.68346405029297, -16.441532135009766, -15.19959831237793, -13.957666397094727, -12.715734481811523, -11.473801612854004, -10.231868743896484, -8.989936828613281, -7.74800443649292, -6.506072044372559, -5.264139175415039, -4.022207260131836, -2.7802748680114746, -1.5383424758911133, -0.29641008377075195, 0.9455223083496094, 2.1874547004699707, 3.429387092590332, 4.671319961547852, 5.913251876831055, 7.155184268951416, 8.397116661071777, 9.639049530029297, 10.8809814453125, 12.122913360595703, 13.364846229553223, 14.606779098510742, 15.848712921142578, 17.09064483642578, 18.332576751708984, 19.57451057434082, 20.816442489624023, 22.058374404907227, 23.300308227539062, 24.542240142822266, 25.78417205810547, 27.026103973388672, 28.268035888671875, 29.50996971130371, 30.751901626586914, 31.993833541870117, 33.23576736450195, 34.477699279785156, 35.71963119506836, 36.96156311035156, 38.203495025634766, 39.44542694091797, 40.68736267089844, 41.92929458618164, 43.171226501464844, 44.41315841674805, 45.65509033203125, 46.89702224731445, 48.138954162597656, 49.38088607788086, 50.62281799316406, 51.86475372314453, 53.106685638427734, 54.34861755371094, 55.59054946899414]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 9.0, 5.0, 10.0, 12.0, 11.0, 24.0, 20.0, 22.0, 17.0, 24.0, 33.0, 37.0, 30.0, 25.0, 36.0, 39.0, 40.0, 40.0, 45.0, 45.0, 40.0, 53.0, 46.0, 32.0, 29.0, 35.0, 24.0, 31.0, 28.0, 32.0, 24.0, 13.0, 13.0, 16.0, 13.0, 14.0, 8.0, 5.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0], "bins": [-18.27943992614746, -17.77526092529297, -17.271081924438477, -16.766902923583984, -16.26272201538086, -15.758543968200684, -15.254364013671875, -14.750185012817383, -14.24600601196289, -13.741827011108398, -13.237648010253906, -12.733468055725098, -12.229289054870605, -11.725110054016113, -11.220930099487305, -10.716751098632812, -10.21257209777832, -9.708393096923828, -9.204214096069336, -8.700034141540527, -8.195855140686035, -7.691676139831543, -7.187496662139893, -6.683317184448242, -6.17913818359375, -5.674959182739258, -5.170779705047607, -4.666600227355957, -4.162421226501465, -3.6582419872283936, -3.1540627479553223, -2.649883508682251, -2.145705223083496, -1.6415259838104248, -1.1373467445373535, -0.6331675052642822, -0.12898826599121094, 0.37519097328186035, 0.8793702125549316, 1.383549451828003, 1.8877286911010742, 2.3919079303741455, 2.896087169647217, 3.400266408920288, 3.9044456481933594, 4.408624649047852, 4.912804126739502, 5.416983604431152, 5.9211626052856445, 6.425341606140137, 6.929521083831787, 7.4337005615234375, 7.93787956237793, 8.442058563232422, 8.946237564086914, 9.450417518615723, 9.954596519470215, 10.458775520324707, 10.962955474853516, 11.467134475708008, 11.9713134765625, 12.475492477416992, 12.979671478271484, 13.483851432800293, 13.988030433654785]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 12.0, 21.0, 52.0, 77.0, 179.0, 385.0, 869.0, 2071.0, 5376.0, 18121.0, 108619.0, 1881463.0, 2035230.0, 114075.0, 18938.0, 5304.0, 1903.0, 811.0, 340.0, 184.0, 102.0, 52.0, 34.0, 18.0, 16.0, 6.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0078125, -5.721923828125, -5.43603515625, -5.150146484375, -4.8642578125, -4.578369140625, -4.29248046875, -4.006591796875, -3.720703125, -3.434814453125, -3.14892578125, -2.863037109375, -2.5771484375, -2.291259765625, -2.00537109375, -1.719482421875, -1.43359375, -1.147705078125, -0.86181640625, -0.575927734375, -0.2900390625, -0.004150390625, 0.28173828125, 0.567626953125, 0.853515625, 1.139404296875, 1.42529296875, 1.711181640625, 1.9970703125, 2.282958984375, 2.56884765625, 2.854736328125, 3.140625, 3.426513671875, 3.71240234375, 3.998291015625, 4.2841796875, 4.570068359375, 4.85595703125, 5.141845703125, 5.427734375, 5.713623046875, 5.99951171875, 6.285400390625, 6.5712890625, 6.857177734375, 7.14306640625, 7.428955078125, 7.71484375, 8.000732421875, 8.28662109375, 8.572509765625, 8.8583984375, 9.144287109375, 9.43017578125, 9.716064453125, 10.001953125, 10.287841796875, 10.57373046875, 10.859619140625, 11.1455078125, 11.431396484375, 11.71728515625, 12.003173828125, 12.2890625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 5.0, 5.0, 14.0, 10.0, 17.0, 36.0, 46.0, 51.0, 78.0, 99.0, 104.0, 128.0, 87.0, 97.0, 56.0, 57.0, 44.0, 24.0, 13.0, 13.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1964111328125, -7.916259765625, -7.6361083984375, -7.35595703125, -7.0758056640625, -6.795654296875, -6.5155029296875, -6.2353515625, -5.9552001953125, -5.675048828125, -5.3948974609375, -5.11474609375, -4.8345947265625, -4.554443359375, -4.2742919921875, -3.994140625, -3.7139892578125, -3.433837890625, -3.1536865234375, -2.87353515625, -2.5933837890625, -2.313232421875, -2.0330810546875, -1.7529296875, -1.4727783203125, -1.192626953125, -0.9124755859375, -0.63232421875, -0.3521728515625, -0.072021484375, 0.2081298828125, 0.48828125, 0.7684326171875, 1.048583984375, 1.3287353515625, 1.60888671875, 1.8890380859375, 2.169189453125, 2.4493408203125, 2.7294921875, 3.0096435546875, 3.289794921875, 3.5699462890625, 3.85009765625, 4.1302490234375, 4.410400390625, 4.6905517578125, 4.970703125, 5.2508544921875, 5.531005859375, 5.8111572265625, 6.09130859375, 6.3714599609375, 6.651611328125, 6.9317626953125, 7.2119140625, 7.4920654296875, 7.772216796875, 8.0523681640625, 8.33251953125, 8.6126708984375, 8.892822265625, 9.1729736328125, 9.453125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 9.0, 6.0, 16.0, 13.0, 25.0, 34.0, 35.0, 68.0, 121.0, 204.0, 443.0, 1215.0, 4322.0, 22133.0, 224127.0, 3667950.0, 243732.0, 23027.0, 4540.0, 1279.0, 457.0, 210.0, 105.0, 77.0, 39.0, 28.0, 26.0, 10.0, 14.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1328125, -9.8211669921875, -9.509521484375, -9.1978759765625, -8.88623046875, -8.5745849609375, -8.262939453125, -7.9512939453125, -7.6396484375, -7.3280029296875, -7.016357421875, -6.7047119140625, -6.39306640625, -6.0814208984375, -5.769775390625, -5.4581298828125, -5.146484375, -4.8348388671875, -4.523193359375, -4.2115478515625, -3.89990234375, -3.5882568359375, -3.276611328125, -2.9649658203125, -2.6533203125, -2.3416748046875, -2.030029296875, -1.7183837890625, -1.40673828125, -1.0950927734375, -0.783447265625, -0.4718017578125, -0.16015625, 0.1514892578125, 0.463134765625, 0.7747802734375, 1.08642578125, 1.3980712890625, 1.709716796875, 2.0213623046875, 2.3330078125, 2.6446533203125, 2.956298828125, 3.2679443359375, 3.57958984375, 3.8912353515625, 4.202880859375, 4.5145263671875, 4.826171875, 5.1378173828125, 5.449462890625, 5.7611083984375, 6.07275390625, 6.3843994140625, 6.696044921875, 7.0076904296875, 7.3193359375, 7.6309814453125, 7.942626953125, 8.2542724609375, 8.56591796875, 8.8775634765625, 9.189208984375, 9.5008544921875, 9.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 7.0, 13.0, 15.0, 23.0, 29.0, 52.0, 71.0, 87.0, 156.0, 270.0, 408.0, 670.0, 688.0, 567.0, 355.0, 219.0, 118.0, 70.0, 68.0, 42.0, 34.0, 20.0, 20.0, 19.0, 11.0, 7.0, 4.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.255859375, -2.188262939453125, -2.12066650390625, -2.053070068359375, -1.9854736328125, -1.917877197265625, -1.85028076171875, -1.782684326171875, -1.715087890625, -1.647491455078125, -1.57989501953125, -1.512298583984375, -1.4447021484375, -1.377105712890625, -1.30950927734375, -1.241912841796875, -1.17431640625, -1.106719970703125, -1.03912353515625, -0.971527099609375, -0.9039306640625, -0.836334228515625, -0.76873779296875, -0.701141357421875, -0.633544921875, -0.565948486328125, -0.49835205078125, -0.430755615234375, -0.3631591796875, -0.295562744140625, -0.22796630859375, -0.160369873046875, -0.0927734375, -0.025177001953125, 0.04241943359375, 0.110015869140625, 0.1776123046875, 0.245208740234375, 0.31280517578125, 0.380401611328125, 0.447998046875, 0.515594482421875, 0.58319091796875, 0.650787353515625, 0.7183837890625, 0.785980224609375, 0.85357666015625, 0.921173095703125, 0.98876953125, 1.056365966796875, 1.12396240234375, 1.191558837890625, 1.2591552734375, 1.326751708984375, 1.39434814453125, 1.461944580078125, 1.529541015625, 1.597137451171875, 1.66473388671875, 1.732330322265625, 1.7999267578125, 1.867523193359375, 1.93511962890625, 2.002716064453125, 2.0703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 6.0, 13.0, 18.0, 32.0, 63.0, 103.0, 214.0, 205.0, 148.0, 94.0, 59.0, 19.0, 15.0, 8.0, 5.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9347662925720215, -5.412812232971191, -4.8908586502075195, -4.368905067443848, -3.8469510078430176, -3.3249971866607666, -2.8030433654785156, -2.2810895442962646, -1.7591357231140137, -1.2371819019317627, -0.7152280807495117, -0.19327425956726074, 0.32867956161499023, 0.8506333827972412, 1.3725872039794922, 1.8945410251617432, 2.416494846343994, 2.938448667526245, 3.460402488708496, 3.982356309890747, 4.504310131072998, 5.026264190673828, 5.5482177734375, 6.070171356201172, 6.592125415802002, 7.114079475402832, 7.636033058166504, 8.157986640930176, 8.679941177368164, 9.201894760131836, 9.723848342895508, 10.24580192565918, 10.767755508422852, 11.289709091186523, 11.811662673950195, 12.333617210388184, 12.855570793151855, 13.377524375915527, 13.899478912353516, 14.421432495117188, 14.94338607788086, 15.465339660644531, 15.987293243408203, 16.509246826171875, 17.031200408935547, 17.55315589904785, 18.075109481811523, 18.597063064575195, 19.119016647338867, 19.64097023010254, 20.16292381286621, 20.684877395629883, 21.206832885742188, 21.72878646850586, 22.25074005126953, 22.772693634033203, 23.294647216796875, 23.816600799560547, 24.33855438232422, 24.86050796508789, 25.382461547851562, 25.904417037963867, 26.42637062072754, 26.94832420349121, 27.470277786254883]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 1.0, 6.0, 10.0, 13.0, 25.0, 24.0, 21.0, 33.0, 31.0, 47.0, 57.0, 73.0, 65.0, 76.0, 58.0, 69.0, 76.0, 70.0, 49.0, 46.0, 41.0, 28.0, 16.0, 13.0, 16.0, 9.0, 10.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.259030818939209, -7.041027069091797, -6.823023796081543, -6.605020046234131, -6.387016296386719, -6.169013023376465, -5.951009273529053, -5.733005523681641, -5.515002250671387, -5.296998500823975, -5.078995227813721, -4.860991477966309, -4.6429877281188965, -4.424984455108643, -4.2069807052612305, -3.9889771938323975, -3.7709734439849854, -3.5529699325561523, -3.3349661827087402, -3.1169626712799072, -2.898959159851074, -2.680955410003662, -2.462951898574829, -2.244948387145996, -2.026944637298584, -1.8089410066604614, -1.5909374952316284, -1.3729338645935059, -1.1549303531646729, -0.9369267225265503, -0.7189230918884277, -0.5009195804595947, -0.2829160690307617, -0.06491248309612274, 0.15309110283851624, 0.3710947036743164, 0.5890982747077942, 0.807101845741272, 1.0251054763793945, 1.2431089878082275, 1.46111261844635, 1.6791162490844727, 1.8971197605133057, 2.1151232719421387, 2.333127021789551, 2.551130533218384, 2.769134044647217, 2.987137794494629, 3.205141305923462, 3.423144817352295, 3.641148567199707, 3.85915207862854, 4.077155590057373, 4.295159339904785, 4.513162612915039, 4.731166362762451, 4.949170112609863, 5.167173862457275, 5.385177135467529, 5.603180885314941, 5.8211846351623535, 6.039187908172607, 6.2571916580200195, 6.475194931030273, 6.6931986808776855]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 21.0, 23.0, 28.0, 63.0, 98.0, 186.0, 358.0, 631.0, 1432.0, 3807.0, 11427.0, 40153.0, 178351.0, 553683.0, 195354.0, 43454.0, 12361.0, 4054.0, 1647.0, 664.0, 306.0, 134.0, 105.0, 68.0, 34.0, 28.0, 16.0, 13.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.80859375, -1.747344970703125, -1.68609619140625, -1.624847412109375, -1.5635986328125, -1.502349853515625, -1.44110107421875, -1.379852294921875, -1.318603515625, -1.257354736328125, -1.19610595703125, -1.134857177734375, -1.0736083984375, -1.012359619140625, -0.95111083984375, -0.889862060546875, -0.82861328125, -0.767364501953125, -0.70611572265625, -0.644866943359375, -0.5836181640625, -0.522369384765625, -0.46112060546875, -0.399871826171875, -0.338623046875, -0.277374267578125, -0.21612548828125, -0.154876708984375, -0.0936279296875, -0.032379150390625, 0.02886962890625, 0.090118408203125, 0.1513671875, 0.212615966796875, 0.27386474609375, 0.335113525390625, 0.3963623046875, 0.457611083984375, 0.51885986328125, 0.580108642578125, 0.641357421875, 0.702606201171875, 0.76385498046875, 0.825103759765625, 0.8863525390625, 0.947601318359375, 1.00885009765625, 1.070098876953125, 1.13134765625, 1.192596435546875, 1.25384521484375, 1.315093994140625, 1.3763427734375, 1.437591552734375, 1.49884033203125, 1.560089111328125, 1.621337890625, 1.682586669921875, 1.74383544921875, 1.805084228515625, 1.8663330078125, 1.927581787109375, 1.98883056640625, 2.050079345703125, 2.111328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 2.0, 7.0, 6.0, 18.0, 13.0, 19.0, 33.0, 28.0, 40.0, 55.0, 73.0, 67.0, 84.0, 74.0, 72.0, 84.0, 75.0, 58.0, 45.0, 39.0, 29.0, 14.0, 15.0, 14.0, 9.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.0560302734375, -4.901123046875, -4.7462158203125, -4.59130859375, -4.4364013671875, -4.281494140625, -4.1265869140625, -3.9716796875, -3.8167724609375, -3.661865234375, -3.5069580078125, -3.35205078125, -3.1971435546875, -3.042236328125, -2.8873291015625, -2.732421875, -2.5775146484375, -2.422607421875, -2.2677001953125, -2.11279296875, -1.9578857421875, -1.802978515625, -1.6480712890625, -1.4931640625, -1.3382568359375, -1.183349609375, -1.0284423828125, -0.87353515625, -0.7186279296875, -0.563720703125, -0.4088134765625, -0.25390625, -0.0989990234375, 0.055908203125, 0.2108154296875, 0.36572265625, 0.5206298828125, 0.675537109375, 0.8304443359375, 0.9853515625, 1.1402587890625, 1.295166015625, 1.4500732421875, 1.60498046875, 1.7598876953125, 1.914794921875, 2.0697021484375, 2.224609375, 2.3795166015625, 2.534423828125, 2.6893310546875, 2.84423828125, 2.9991455078125, 3.154052734375, 3.3089599609375, 3.4638671875, 3.6187744140625, 3.773681640625, 3.9285888671875, 4.08349609375, 4.2384033203125, 4.393310546875, 4.5482177734375, 4.703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 10.0, 14.0, 14.0, 20.0, 32.0, 59.0, 72.0, 110.0, 170.0, 297.0, 479.0, 948.0, 2077.0, 4968.0, 13480.0, 40137.0, 148622.0, 461973.0, 271484.0, 68709.0, 21405.0, 7525.0, 3017.0, 1343.0, 651.0, 351.0, 186.0, 130.0, 86.0, 51.0, 31.0, 23.0, 17.0, 15.0, 13.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3759765625, -1.3296661376953125, -1.283355712890625, -1.2370452880859375, -1.19073486328125, -1.1444244384765625, -1.098114013671875, -1.0518035888671875, -1.0054931640625, -0.9591827392578125, -0.912872314453125, -0.8665618896484375, -0.82025146484375, -0.7739410400390625, -0.727630615234375, -0.6813201904296875, -0.635009765625, -0.5886993408203125, -0.542388916015625, -0.4960784912109375, -0.44976806640625, -0.4034576416015625, -0.357147216796875, -0.3108367919921875, -0.2645263671875, -0.2182159423828125, -0.171905517578125, -0.1255950927734375, -0.07928466796875, -0.0329742431640625, 0.013336181640625, 0.0596466064453125, 0.10595703125, 0.1522674560546875, 0.198577880859375, 0.2448883056640625, 0.29119873046875, 0.3375091552734375, 0.383819580078125, 0.4301300048828125, 0.4764404296875, 0.5227508544921875, 0.569061279296875, 0.6153717041015625, 0.66168212890625, 0.7079925537109375, 0.754302978515625, 0.8006134033203125, 0.846923828125, 0.8932342529296875, 0.939544677734375, 0.9858551025390625, 1.03216552734375, 1.0784759521484375, 1.124786376953125, 1.1710968017578125, 1.2174072265625, 1.2637176513671875, 1.310028076171875, 1.3563385009765625, 1.40264892578125, 1.4489593505859375, 1.495269775390625, 1.5415802001953125, 1.587890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 14.0, 7.0, 17.0, 13.0, 16.0, 29.0, 26.0, 25.0, 48.0, 40.0, 42.0, 40.0, 50.0, 59.0, 56.0, 60.0, 44.0, 53.0, 36.0, 46.0, 45.0, 36.0, 25.0, 25.0, 25.0, 17.0, 21.0, 23.0, 15.0, 8.0, 8.0, 6.0, 8.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.058349609375, -5.82763671875, -5.596923828125, -5.3662109375, -5.135498046875, -4.90478515625, -4.674072265625, -4.443359375, -4.212646484375, -3.98193359375, -3.751220703125, -3.5205078125, -3.289794921875, -3.05908203125, -2.828369140625, -2.59765625, -2.366943359375, -2.13623046875, -1.905517578125, -1.6748046875, -1.444091796875, -1.21337890625, -0.982666015625, -0.751953125, -0.521240234375, -0.29052734375, -0.059814453125, 0.1708984375, 0.401611328125, 0.63232421875, 0.863037109375, 1.09375, 1.324462890625, 1.55517578125, 1.785888671875, 2.0166015625, 2.247314453125, 2.47802734375, 2.708740234375, 2.939453125, 3.170166015625, 3.40087890625, 3.631591796875, 3.8623046875, 4.093017578125, 4.32373046875, 4.554443359375, 4.78515625, 5.015869140625, 5.24658203125, 5.477294921875, 5.7080078125, 5.938720703125, 6.16943359375, 6.400146484375, 6.630859375, 6.861572265625, 7.09228515625, 7.322998046875, 7.5537109375, 7.784423828125, 8.01513671875, 8.245849609375, 8.4765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 9.0, 8.0, 8.0, 24.0, 40.0, 68.0, 105.0, 191.0, 355.0, 693.0, 1527.0, 3528.0, 9058.0, 27585.0, 114422.0, 485689.0, 313396.0, 63266.0, 17650.0, 6043.0, 2527.0, 1131.0, 576.0, 273.0, 140.0, 97.0, 46.0, 32.0, 17.0, 12.0, 7.0, 8.0, 5.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6777114868164062, -0.6557159423828125, -0.6337203979492188, -0.611724853515625, -0.5897293090820312, -0.5677337646484375, -0.5457382202148438, -0.52374267578125, -0.5017471313476562, -0.4797515869140625, -0.45775604248046875, -0.435760498046875, -0.41376495361328125, -0.3917694091796875, -0.36977386474609375, -0.3477783203125, -0.32578277587890625, -0.3037872314453125, -0.28179168701171875, -0.259796142578125, -0.23780059814453125, -0.2158050537109375, -0.19380950927734375, -0.17181396484375, -0.14981842041015625, -0.1278228759765625, -0.10582733154296875, -0.083831787109375, -0.06183624267578125, -0.0398406982421875, -0.01784515380859375, 0.004150390625, 0.02614593505859375, 0.0481414794921875, 0.07013702392578125, 0.092132568359375, 0.11412811279296875, 0.1361236572265625, 0.15811920166015625, 0.18011474609375, 0.20211029052734375, 0.2241058349609375, 0.24610137939453125, 0.268096923828125, 0.29009246826171875, 0.3120880126953125, 0.33408355712890625, 0.3560791015625, 0.37807464599609375, 0.4000701904296875, 0.42206573486328125, 0.444061279296875, 0.46605682373046875, 0.4880523681640625, 0.5100479125976562, 0.53204345703125, 0.5540390014648438, 0.5760345458984375, 0.5980300903320312, 0.620025634765625, 0.6420211791992188, 0.6640167236328125, 0.6860122680664062, 0.7080078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 4.0, 11.0, 6.0, 6.0, 2.0, 15.0, 9.0, 15.0, 10.0, 31.0, 33.0, 33.0, 50.0, 77.0, 60.0, 84.0, 99.0, 76.0, 73.0, 64.0, 42.0, 44.0, 29.0, 38.0, 24.0, 20.0, 10.0, 4.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.000339508056640625, -0.0003306921571493149, -0.00032187625765800476, -0.00031306035816669464, -0.0003042444586753845, -0.0002954285591840744, -0.0002866126596927643, -0.00027779676020145416, -0.00026898086071014404, -0.0002601649612188339, -0.0002513490617275238, -0.00024253316223621368, -0.00023371726274490356, -0.00022490136325359344, -0.00021608546376228333, -0.0002072695642709732, -0.00019845366477966309, -0.00018963776528835297, -0.00018082186579704285, -0.00017200596630573273, -0.0001631900668144226, -0.0001543741673231125, -0.00014555826783180237, -0.00013674236834049225, -0.00012792646884918213, -0.00011911056935787201, -0.00011029466986656189, -0.00010147877037525177, -9.266287088394165e-05, -8.384697139263153e-05, -7.503107190132141e-05, -6.621517241001129e-05, -5.739927291870117e-05, -4.858337342739105e-05, -3.976747393608093e-05, -3.095157444477081e-05, -2.2135674953460693e-05, -1.3319775462150574e-05, -4.503875970840454e-06, 4.3120235204696655e-06, 1.3127923011779785e-05, 2.1943822503089905e-05, 3.0759721994400024e-05, 3.9575621485710144e-05, 4.8391520977020264e-05, 5.720742046833038e-05, 6.60233199596405e-05, 7.483921945095062e-05, 8.365511894226074e-05, 9.247101843357086e-05, 0.00010128691792488098, 0.0001101028174161911, 0.00011891871690750122, 0.00012773461639881134, 0.00013655051589012146, 0.00014536641538143158, 0.0001541823148727417, 0.00016299821436405182, 0.00017181411385536194, 0.00018063001334667206, 0.00018944591283798218, 0.0001982618123292923, 0.00020707771182060242, 0.00021589361131191254, 0.00022470951080322266]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 11.0, 9.0, 13.0, 20.0, 23.0, 39.0, 47.0, 59.0, 121.0, 147.0, 235.0, 399.0, 700.0, 1283.0, 2549.0, 5720.0, 13822.0, 40216.0, 142618.0, 427585.0, 291387.0, 79435.0, 24579.0, 9145.0, 3991.0, 1953.0, 987.0, 513.0, 339.0, 185.0, 112.0, 81.0, 70.0, 36.0, 33.0, 24.0, 11.0, 6.0, 8.0, 14.0, 7.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5595703125, -0.541961669921875, -0.52435302734375, -0.506744384765625, -0.4891357421875, -0.471527099609375, -0.45391845703125, -0.436309814453125, -0.418701171875, -0.401092529296875, -0.38348388671875, -0.365875244140625, -0.3482666015625, -0.330657958984375, -0.31304931640625, -0.295440673828125, -0.27783203125, -0.260223388671875, -0.24261474609375, -0.225006103515625, -0.2073974609375, -0.189788818359375, -0.17218017578125, -0.154571533203125, -0.136962890625, -0.119354248046875, -0.10174560546875, -0.084136962890625, -0.0665283203125, -0.048919677734375, -0.03131103515625, -0.013702392578125, 0.00390625, 0.021514892578125, 0.03912353515625, 0.056732177734375, 0.0743408203125, 0.091949462890625, 0.10955810546875, 0.127166748046875, 0.144775390625, 0.162384033203125, 0.17999267578125, 0.197601318359375, 0.2152099609375, 0.232818603515625, 0.25042724609375, 0.268035888671875, 0.28564453125, 0.303253173828125, 0.32086181640625, 0.338470458984375, 0.3560791015625, 0.373687744140625, 0.39129638671875, 0.408905029296875, 0.426513671875, 0.444122314453125, 0.46173095703125, 0.479339599609375, 0.4969482421875, 0.514556884765625, 0.53216552734375, 0.549774169921875, 0.5673828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 6.0, 10.0, 12.0, 16.0, 14.0, 20.0, 21.0, 24.0, 33.0, 38.0, 32.0, 47.0, 55.0, 64.0, 66.0, 62.0, 64.0, 52.0, 56.0, 40.0, 42.0, 34.0, 30.0, 30.0, 20.0, 21.0, 11.0, 11.0, 10.0, 8.0, 6.0, 5.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1219482421875, -0.11791229248046875, -0.1138763427734375, -0.10984039306640625, -0.105804443359375, -0.10176849365234375, -0.0977325439453125, -0.09369659423828125, -0.08966064453125, -0.08562469482421875, -0.0815887451171875, -0.07755279541015625, -0.073516845703125, -0.06948089599609375, -0.0654449462890625, -0.06140899658203125, -0.057373046875, -0.05333709716796875, -0.0493011474609375, -0.04526519775390625, -0.041229248046875, -0.03719329833984375, -0.0331573486328125, -0.02912139892578125, -0.02508544921875, -0.02104949951171875, -0.0170135498046875, -0.01297760009765625, -0.008941650390625, -0.00490570068359375, -0.0008697509765625, 0.00316619873046875, 0.0072021484375, 0.01123809814453125, 0.0152740478515625, 0.01930999755859375, 0.023345947265625, 0.02738189697265625, 0.0314178466796875, 0.03545379638671875, 0.03948974609375, 0.04352569580078125, 0.0475616455078125, 0.05159759521484375, 0.055633544921875, 0.05966949462890625, 0.0637054443359375, 0.06774139404296875, 0.07177734375, 0.07581329345703125, 0.0798492431640625, 0.08388519287109375, 0.087921142578125, 0.09195709228515625, 0.0959930419921875, 0.10002899169921875, 0.10406494140625, 0.10810089111328125, 0.1121368408203125, 0.11617279052734375, 0.120208740234375, 0.12424468994140625, 0.1282806396484375, 0.13231658935546875, 0.1363525390625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 22.0, 36.0, 76.0, 168.0, 256.0, 202.0, 113.0, 63.0, 20.0, 13.0, 13.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0867180824279785, -3.7099244594573975, -3.3331308364868164, -2.9563372135162354, -2.5795435905456543, -2.2027499675750732, -1.8259563446044922, -1.4491627216339111, -1.07236909866333, -0.695575475692749, -0.31878185272216797, 0.058011770248413086, 0.43480539321899414, 0.8115990161895752, 1.1883926391601562, 1.5651862621307373, 1.9419798851013184, 2.3187735080718994, 2.6955671310424805, 3.0723607540130615, 3.4491543769836426, 3.8259479999542236, 4.202741622924805, 4.579535484313965, 4.956328868865967, 5.333122253417969, 5.709916114807129, 6.086709976196289, 6.463503360748291, 6.840296745300293, 7.217090606689453, 7.593884468078613, 7.970678329467773, 8.347472190856934, 8.724266052246094, 9.101058959960938, 9.477852821350098, 9.854646682739258, 10.231439590454102, 10.608233451843262, 10.985027313232422, 11.361821174621582, 11.738615036010742, 12.115407943725586, 12.492201805114746, 12.868995666503906, 13.24578857421875, 13.62258243560791, 13.99937629699707, 14.37617015838623, 14.75296401977539, 15.129756927490234, 15.506550788879395, 15.883344650268555, 16.2601375579834, 16.636932373046875, 17.01372528076172, 17.390518188476562, 17.76731300354004, 18.144105911254883, 18.52090072631836, 18.897693634033203, 19.274486541748047, 19.651281356811523, 20.028074264526367]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 8.0, 19.0, 25.0, 25.0, 26.0, 46.0, 33.0, 58.0, 74.0, 74.0, 82.0, 68.0, 69.0, 75.0, 82.0, 57.0, 48.0, 28.0, 25.0, 18.0, 14.0, 8.0, 9.0, 4.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.580511569976807, -4.429073810577393, -4.2776360511779785, -4.1261982917785645, -3.9747607707977295, -3.8233230113983154, -3.6718854904174805, -3.5204477310180664, -3.3690099716186523, -3.2175722122192383, -3.066134452819824, -2.9146969318389893, -2.763259172439575, -2.611821413040161, -2.460383892059326, -2.308946132659912, -2.157508373260498, -2.006070613861084, -1.8546329736709595, -1.703195333480835, -1.551757574081421, -1.4003198146820068, -1.2488821744918823, -1.0974445343017578, -0.9460067749023438, -0.7945690751075745, -0.6431313753128052, -0.4916936755180359, -0.3402559757232666, -0.18881827592849731, -0.03738057613372803, 0.11405706405639648, 0.26549482345581055, 0.41693252325057983, 0.5683702230453491, 0.7198079228401184, 0.8712456226348877, 1.0226833820343018, 1.1741210222244263, 1.3255586624145508, 1.4769964218139648, 1.628434181213379, 1.7798718214035034, 1.931309461593628, 2.082747220993042, 2.234184980392456, 2.385622501373291, 2.537060260772705, 2.688498020172119, 2.839935779571533, 2.9913735389709473, 3.1428110599517822, 3.2942488193511963, 3.4456865787506104, 3.5971240997314453, 3.7485618591308594, 3.8999996185302734, 4.0514373779296875, 4.202875137329102, 4.354312896728516, 4.50575065612793, 4.6571879386901855, 4.8086256980896, 4.960063457489014, 5.111501216888428]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 15.0, 18.0, 19.0, 31.0, 55.0, 60.0, 112.0, 165.0, 292.0, 488.0, 802.0, 1608.0, 3453.0, 7611.0, 19401.0, 64143.0, 334190.0, 487238.0, 87056.0, 24677.0, 9005.0, 3875.0, 1897.0, 928.0, 580.0, 320.0, 186.0, 122.0, 69.0, 47.0, 32.0, 21.0, 15.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5390625, -3.41314697265625, -3.2872314453125, -3.16131591796875, -3.035400390625, -2.90948486328125, -2.7835693359375, -2.65765380859375, -2.53173828125, -2.40582275390625, -2.2799072265625, -2.15399169921875, -2.028076171875, -1.90216064453125, -1.7762451171875, -1.65032958984375, -1.5244140625, -1.39849853515625, -1.2725830078125, -1.14666748046875, -1.020751953125, -0.89483642578125, -0.7689208984375, -0.64300537109375, -0.51708984375, -0.39117431640625, -0.2652587890625, -0.13934326171875, -0.013427734375, 0.11248779296875, 0.2384033203125, 0.36431884765625, 0.490234375, 0.61614990234375, 0.7420654296875, 0.86798095703125, 0.993896484375, 1.11981201171875, 1.2457275390625, 1.37164306640625, 1.49755859375, 1.62347412109375, 1.7493896484375, 1.87530517578125, 2.001220703125, 2.12713623046875, 2.2530517578125, 2.37896728515625, 2.5048828125, 2.63079833984375, 2.7567138671875, 2.88262939453125, 3.008544921875, 3.13446044921875, 3.2603759765625, 3.38629150390625, 3.51220703125, 3.63812255859375, 3.7640380859375, 3.88995361328125, 4.015869140625, 4.14178466796875, 4.2677001953125, 4.39361572265625, 4.51953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 13.0, 26.0, 27.0, 28.0, 37.0, 46.0, 76.0, 61.0, 82.0, 66.0, 86.0, 71.0, 76.0, 57.0, 54.0, 44.0, 36.0, 19.0, 13.0, 18.0, 6.0, 6.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5965576171875, -10.263427734375, -9.9302978515625, -9.59716796875, -9.2640380859375, -8.930908203125, -8.5977783203125, -8.2646484375, -7.9315185546875, -7.598388671875, -7.2652587890625, -6.93212890625, -6.5989990234375, -6.265869140625, -5.9327392578125, -5.599609375, -5.2664794921875, -4.933349609375, -4.6002197265625, -4.26708984375, -3.9339599609375, -3.600830078125, -3.2677001953125, -2.9345703125, -2.6014404296875, -2.268310546875, -1.9351806640625, -1.60205078125, -1.2689208984375, -0.935791015625, -0.6026611328125, -0.26953125, 0.0635986328125, 0.396728515625, 0.7298583984375, 1.06298828125, 1.3961181640625, 1.729248046875, 2.0623779296875, 2.3955078125, 2.7286376953125, 3.061767578125, 3.3948974609375, 3.72802734375, 4.0611572265625, 4.394287109375, 4.7274169921875, 5.060546875, 5.3936767578125, 5.726806640625, 6.0599365234375, 6.39306640625, 6.7261962890625, 7.059326171875, 7.3924560546875, 7.7255859375, 8.0587158203125, 8.391845703125, 8.7249755859375, 9.05810546875, 9.3912353515625, 9.724365234375, 10.0574951171875, 10.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 8.0, 12.0, 20.0, 21.0, 31.0, 53.0, 59.0, 118.0, 226.0, 484.0, 1253.0, 4739.0, 28613.0, 394421.0, 570859.0, 38916.0, 5992.0, 1522.0, 536.0, 264.0, 148.0, 88.0, 51.0, 39.0, 16.0, 26.0, 19.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.466552734375, -4.27294921875, -4.079345703125, -3.8857421875, -3.692138671875, -3.49853515625, -3.304931640625, -3.111328125, -2.917724609375, -2.72412109375, -2.530517578125, -2.3369140625, -2.143310546875, -1.94970703125, -1.756103515625, -1.5625, -1.368896484375, -1.17529296875, -0.981689453125, -0.7880859375, -0.594482421875, -0.40087890625, -0.207275390625, -0.013671875, 0.179931640625, 0.37353515625, 0.567138671875, 0.7607421875, 0.954345703125, 1.14794921875, 1.341552734375, 1.53515625, 1.728759765625, 1.92236328125, 2.115966796875, 2.3095703125, 2.503173828125, 2.69677734375, 2.890380859375, 3.083984375, 3.277587890625, 3.47119140625, 3.664794921875, 3.8583984375, 4.052001953125, 4.24560546875, 4.439208984375, 4.6328125, 4.826416015625, 5.02001953125, 5.213623046875, 5.4072265625, 5.600830078125, 5.79443359375, 5.988037109375, 6.181640625, 6.375244140625, 6.56884765625, 6.762451171875, 6.9560546875, 7.149658203125, 7.34326171875, 7.536865234375, 7.73046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 12.0, 11.0, 19.0, 19.0, 14.0, 21.0, 33.0, 31.0, 38.0, 45.0, 23.0, 28.0, 53.0, 59.0, 59.0, 44.0, 57.0, 48.0, 53.0, 59.0, 36.0, 27.0, 32.0, 26.0, 26.0, 28.0, 15.0, 13.0, 14.0, 13.0, 6.0, 6.0, 3.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2308349609375, -9.899169921875, -9.5675048828125, -9.23583984375, -8.9041748046875, -8.572509765625, -8.2408447265625, -7.9091796875, -7.5775146484375, -7.245849609375, -6.9141845703125, -6.58251953125, -6.2508544921875, -5.919189453125, -5.5875244140625, -5.255859375, -4.9241943359375, -4.592529296875, -4.2608642578125, -3.92919921875, -3.5975341796875, -3.265869140625, -2.9342041015625, -2.6025390625, -2.2708740234375, -1.939208984375, -1.6075439453125, -1.27587890625, -0.9442138671875, -0.612548828125, -0.2808837890625, 0.05078125, 0.3824462890625, 0.714111328125, 1.0457763671875, 1.37744140625, 1.7091064453125, 2.040771484375, 2.3724365234375, 2.7041015625, 3.0357666015625, 3.367431640625, 3.6990966796875, 4.03076171875, 4.3624267578125, 4.694091796875, 5.0257568359375, 5.357421875, 5.6890869140625, 6.020751953125, 6.3524169921875, 6.68408203125, 7.0157470703125, 7.347412109375, 7.6790771484375, 8.0107421875, 8.3424072265625, 8.674072265625, 9.0057373046875, 9.33740234375, 9.6690673828125, 10.000732421875, 10.3323974609375, 10.6640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 16.0, 28.0, 91.0, 266.0, 1558.0, 79382.0, 958510.0, 7825.0, 601.0, 149.0, 66.0, 26.0, 16.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.27667236328125, -4.1353759765625, -3.99407958984375, -3.852783203125, -3.71148681640625, -3.5701904296875, -3.42889404296875, -3.28759765625, -3.14630126953125, -3.0050048828125, -2.86370849609375, -2.722412109375, -2.58111572265625, -2.4398193359375, -2.29852294921875, -2.1572265625, -2.01593017578125, -1.8746337890625, -1.73333740234375, -1.592041015625, -1.45074462890625, -1.3094482421875, -1.16815185546875, -1.02685546875, -0.88555908203125, -0.7442626953125, -0.60296630859375, -0.461669921875, -0.32037353515625, -0.1790771484375, -0.03778076171875, 0.103515625, 0.24481201171875, 0.3861083984375, 0.52740478515625, 0.668701171875, 0.80999755859375, 0.9512939453125, 1.09259033203125, 1.23388671875, 1.37518310546875, 1.5164794921875, 1.65777587890625, 1.799072265625, 1.94036865234375, 2.0816650390625, 2.22296142578125, 2.3642578125, 2.50555419921875, 2.6468505859375, 2.78814697265625, 2.929443359375, 3.07073974609375, 3.2120361328125, 3.35333251953125, 3.49462890625, 3.63592529296875, 3.7772216796875, 3.91851806640625, 4.059814453125, 4.20111083984375, 4.3424072265625, 4.48370361328125, 4.625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 9.0, 9.0, 16.0, 8.0, 15.0, 12.0, 22.0, 32.0, 33.0, 48.0, 63.0, 63.0, 96.0, 113.0, 96.0, 83.0, 71.0, 53.0, 41.0, 21.0, 23.0, 18.0, 18.0, 16.0, 4.0, 6.0, 6.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013577938079833984, -0.0001304764300584793, -0.00012517347931861877, -0.00011987052857875824, -0.0001145675778388977, -0.00010926462709903717, -0.00010396167635917664, -9.86587256193161e-05, -9.335577487945557e-05, -8.805282413959503e-05, -8.27498733997345e-05, -7.744692265987396e-05, -7.214397192001343e-05, -6.684102118015289e-05, -6.153807044029236e-05, -5.6235119700431824e-05, -5.093216896057129e-05, -4.5629218220710754e-05, -4.032626748085022e-05, -3.5023316740989685e-05, -2.972036600112915e-05, -2.4417415261268616e-05, -1.911446452140808e-05, -1.3811513781547546e-05, -8.508563041687012e-06, -3.205612301826477e-06, 2.0973384380340576e-06, 7.400289177894592e-06, 1.2703239917755127e-05, 1.800619065761566e-05, 2.3309141397476196e-05, 2.861209213733673e-05, 3.3915042877197266e-05, 3.92179936170578e-05, 4.4520944356918335e-05, 4.982389509677887e-05, 5.5126845836639404e-05, 6.042979657649994e-05, 6.573274731636047e-05, 7.103569805622101e-05, 7.633864879608154e-05, 8.164159953594208e-05, 8.694455027580261e-05, 9.224750101566315e-05, 9.755045175552368e-05, 0.00010285340249538422, 0.00010815635323524475, 0.00011345930397510529, 0.00011876225471496582, 0.00012406520545482635, 0.0001293681561946869, 0.00013467110693454742, 0.00013997405767440796, 0.0001452770084142685, 0.00015057995915412903, 0.00015588290989398956, 0.0001611858606338501, 0.00016648881137371063, 0.00017179176211357117, 0.0001770947128534317, 0.00018239766359329224, 0.00018770061433315277, 0.0001930035650730133, 0.00019830651581287384, 0.00020360946655273438]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 25.0, 26.0, 30.0, 68.0, 111.0, 166.0, 334.0, 676.0, 1710.0, 5287.0, 20236.0, 119264.0, 657718.0, 201446.0, 30422.0, 6994.0, 2323.0, 839.0, 348.0, 205.0, 101.0, 75.0, 54.0, 35.0, 15.0, 14.0, 12.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4423828125, -1.3994903564453125, -1.356597900390625, -1.3137054443359375, -1.27081298828125, -1.2279205322265625, -1.185028076171875, -1.1421356201171875, -1.0992431640625, -1.0563507080078125, -1.013458251953125, -0.9705657958984375, -0.92767333984375, -0.8847808837890625, -0.841888427734375, -0.7989959716796875, -0.756103515625, -0.7132110595703125, -0.670318603515625, -0.6274261474609375, -0.58453369140625, -0.5416412353515625, -0.498748779296875, -0.4558563232421875, -0.4129638671875, -0.3700714111328125, -0.327178955078125, -0.2842864990234375, -0.24139404296875, -0.1985015869140625, -0.155609130859375, -0.1127166748046875, -0.06982421875, -0.0269317626953125, 0.015960693359375, 0.0588531494140625, 0.10174560546875, 0.1446380615234375, 0.187530517578125, 0.2304229736328125, 0.2733154296875, 0.3162078857421875, 0.359100341796875, 0.4019927978515625, 0.44488525390625, 0.4877777099609375, 0.530670166015625, 0.5735626220703125, 0.616455078125, 0.6593475341796875, 0.702239990234375, 0.7451324462890625, 0.78802490234375, 0.8309173583984375, 0.873809814453125, 0.9167022705078125, 0.9595947265625, 1.0024871826171875, 1.045379638671875, 1.0882720947265625, 1.13116455078125, 1.1740570068359375, 1.216949462890625, 1.2598419189453125, 1.302734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 10.0, 15.0, 20.0, 30.0, 49.0, 59.0, 82.0, 134.0, 164.0, 129.0, 98.0, 77.0, 50.0, 33.0, 19.0, 8.0, 12.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.8021926879882812, -0.7747955322265625, -0.7473983764648438, -0.720001220703125, -0.6926040649414062, -0.6652069091796875, -0.6378097534179688, -0.61041259765625, -0.5830154418945312, -0.5556182861328125, -0.5282211303710938, -0.500823974609375, -0.47342681884765625, -0.4460296630859375, -0.41863250732421875, -0.3912353515625, -0.36383819580078125, -0.3364410400390625, -0.30904388427734375, -0.281646728515625, -0.25424957275390625, -0.2268524169921875, -0.19945526123046875, -0.17205810546875, -0.14466094970703125, -0.1172637939453125, -0.08986663818359375, -0.062469482421875, -0.03507232666015625, -0.0076751708984375, 0.01972198486328125, 0.047119140625, 0.07451629638671875, 0.1019134521484375, 0.12931060791015625, 0.156707763671875, 0.18410491943359375, 0.2115020751953125, 0.23889923095703125, 0.26629638671875, 0.29369354248046875, 0.3210906982421875, 0.34848785400390625, 0.375885009765625, 0.40328216552734375, 0.4306793212890625, 0.45807647705078125, 0.4854736328125, 0.5128707885742188, 0.5402679443359375, 0.5676651000976562, 0.595062255859375, 0.6224594116210938, 0.6498565673828125, 0.6772537231445312, 0.70465087890625, 0.7320480346679688, 0.7594451904296875, 0.7868423461914062, 0.814239501953125, 0.8416366577148438, 0.8690338134765625, 0.8964309692382812, 0.923828125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 10.0, 16.0, 45.0, 124.0, 269.0, 311.0, 152.0, 47.0, 24.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.645073890686035, -6.574057579040527, -5.503040790557861, -4.432024002075195, -3.3610076904296875, -2.2899913787841797, -1.2189745903015137, -0.14795780181884766, 0.9230585098266602, 1.994075059890747, 3.065091609954834, 4.1361083984375, 5.207124710083008, 6.278141021728516, 7.349157810211182, 8.420174598693848, 9.491190910339355, 10.562207221984863, 11.633224487304688, 12.704240798950195, 13.775257110595703, 14.846273422241211, 15.917289733886719, 16.98830795288086, 18.059322357177734, 19.130338668823242, 20.20135498046875, 21.272371292114258, 22.343387603759766, 23.414405822753906, 24.485422134399414, 25.556438446044922, 26.627452850341797, 27.698469161987305, 28.769485473632812, 29.84050178527832, 30.911518096923828, 31.98253631591797, 33.053550720214844, 34.124568939208984, 35.195587158203125, 36.266605377197266, 37.33761978149414, 38.40863800048828, 39.479652404785156, 40.5506706237793, 41.62168502807617, 42.69270324707031, 43.76371765136719, 44.83473587036133, 45.9057502746582, 46.976768493652344, 48.04778289794922, 49.11880111694336, 50.189815521240234, 51.260833740234375, 52.33184814453125, 53.40286636352539, 54.473880767822266, 55.544898986816406, 56.61591339111328, 57.68693161010742, 58.7579460144043, 59.82896423339844, 60.89998245239258]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 8.0, 0.0, 7.0, 7.0, 11.0, 12.0, 16.0, 12.0, 10.0, 26.0, 26.0, 33.0, 18.0, 26.0, 32.0, 28.0, 33.0, 58.0, 40.0, 51.0, 32.0, 51.0, 54.0, 31.0, 41.0, 46.0, 38.0, 38.0, 30.0, 23.0, 23.0, 35.0, 20.0, 19.0, 8.0, 9.0, 7.0, 17.0, 9.0, 10.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.096542358398438, -16.643341064453125, -16.190139770507812, -15.736936569213867, -15.283735275268555, -14.830533981323242, -14.377331733703613, -13.924129486083984, -13.470928192138672, -13.01772689819336, -12.56452465057373, -12.111322402954102, -11.658121109008789, -11.204919815063477, -10.751717567443848, -10.298515319824219, -9.845314025878906, -9.392112731933594, -8.938910484313965, -8.485708236694336, -8.032506942749023, -7.579305171966553, -7.126103401184082, -6.672901630401611, -6.219699859619141, -5.76649808883667, -5.313296318054199, -4.8600945472717285, -4.406892776489258, -3.953691005706787, -3.5004892349243164, -3.0472874641418457, -2.5940847396850586, -2.140882968902588, -1.6876811981201172, -1.2344794273376465, -0.7812776565551758, -0.3280758857727051, 0.12512588500976562, 0.5783276557922363, 1.031529426574707, 1.4847311973571777, 1.9379329681396484, 2.391134738922119, 2.84433650970459, 3.2975382804870605, 3.7507400512695312, 4.203941822052002, 4.657143592834473, 5.110345363616943, 5.563547134399414, 6.016748905181885, 6.4699506759643555, 6.923152446746826, 7.376354217529297, 7.829555988311768, 8.282757759094238, 8.735960006713867, 9.18916130065918, 9.642362594604492, 10.095564842224121, 10.54876708984375, 11.001968383789062, 11.455169677734375, 11.908371925354004]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 18.0, 29.0, 47.0, 87.0, 187.0, 330.0, 667.0, 1896.0, 6278.0, 29272.0, 669266.0, 3379883.0, 90277.0, 11240.0, 2803.0, 1063.0, 409.0, 207.0, 131.0, 58.0, 40.0, 30.0, 19.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -7.9610595703125, -7.586181640625, -7.2113037109375, -6.83642578125, -6.4615478515625, -6.086669921875, -5.7117919921875, -5.3369140625, -4.9620361328125, -4.587158203125, -4.2122802734375, -3.83740234375, -3.4625244140625, -3.087646484375, -2.7127685546875, -2.337890625, -1.9630126953125, -1.588134765625, -1.2132568359375, -0.83837890625, -0.4635009765625, -0.088623046875, 0.2862548828125, 0.6611328125, 1.0360107421875, 1.410888671875, 1.7857666015625, 2.16064453125, 2.5355224609375, 2.910400390625, 3.2852783203125, 3.66015625, 4.0350341796875, 4.409912109375, 4.7847900390625, 5.15966796875, 5.5345458984375, 5.909423828125, 6.2843017578125, 6.6591796875, 7.0340576171875, 7.408935546875, 7.7838134765625, 8.15869140625, 8.5335693359375, 8.908447265625, 9.2833251953125, 9.658203125, 10.0330810546875, 10.407958984375, 10.7828369140625, 11.15771484375, 11.5325927734375, 11.907470703125, 12.2823486328125, 12.6572265625, 13.0321044921875, 13.406982421875, 13.7818603515625, 14.15673828125, 14.5316162109375, 14.906494140625, 15.2813720703125, 15.65625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 17.0, 26.0, 42.0, 40.0, 62.0, 67.0, 77.0, 93.0, 101.0, 107.0, 74.0, 69.0, 63.0, 48.0, 23.0, 32.0, 10.0, 10.0, 9.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3515625, -6.1365966796875, -5.921630859375, -5.7066650390625, -5.49169921875, -5.2767333984375, -5.061767578125, -4.8468017578125, -4.6318359375, -4.4168701171875, -4.201904296875, -3.9869384765625, -3.77197265625, -3.5570068359375, -3.342041015625, -3.1270751953125, -2.912109375, -2.6971435546875, -2.482177734375, -2.2672119140625, -2.05224609375, -1.8372802734375, -1.622314453125, -1.4073486328125, -1.1923828125, -0.9774169921875, -0.762451171875, -0.5474853515625, -0.33251953125, -0.1175537109375, 0.097412109375, 0.3123779296875, 0.52734375, 0.7423095703125, 0.957275390625, 1.1722412109375, 1.38720703125, 1.6021728515625, 1.817138671875, 2.0321044921875, 2.2470703125, 2.4620361328125, 2.677001953125, 2.8919677734375, 3.10693359375, 3.3218994140625, 3.536865234375, 3.7518310546875, 3.966796875, 4.1817626953125, 4.396728515625, 4.6116943359375, 4.82666015625, 5.0416259765625, 5.256591796875, 5.4715576171875, 5.6865234375, 5.9014892578125, 6.116455078125, 6.3314208984375, 6.54638671875, 6.7613525390625, 6.976318359375, 7.1912841796875, 7.40625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 14.0, 15.0, 22.0, 32.0, 62.0, 88.0, 216.0, 493.0, 1394.0, 6163.0, 52155.0, 3349963.0, 753489.0, 24768.0, 3682.0, 955.0, 362.0, 163.0, 70.0, 51.0, 31.0, 19.0, 19.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.29443359375, -9.9248046875, -9.55517578125, -9.185546875, -8.81591796875, -8.4462890625, -8.07666015625, -7.70703125, -7.33740234375, -6.9677734375, -6.59814453125, -6.228515625, -5.85888671875, -5.4892578125, -5.11962890625, -4.75, -4.38037109375, -4.0107421875, -3.64111328125, -3.271484375, -2.90185546875, -2.5322265625, -2.16259765625, -1.79296875, -1.42333984375, -1.0537109375, -0.68408203125, -0.314453125, 0.05517578125, 0.4248046875, 0.79443359375, 1.1640625, 1.53369140625, 1.9033203125, 2.27294921875, 2.642578125, 3.01220703125, 3.3818359375, 3.75146484375, 4.12109375, 4.49072265625, 4.8603515625, 5.22998046875, 5.599609375, 5.96923828125, 6.3388671875, 6.70849609375, 7.078125, 7.44775390625, 7.8173828125, 8.18701171875, 8.556640625, 8.92626953125, 9.2958984375, 9.66552734375, 10.03515625, 10.40478515625, 10.7744140625, 11.14404296875, 11.513671875, 11.88330078125, 12.2529296875, 12.62255859375, 12.9921875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 13.0, 16.0, 22.0, 34.0, 37.0, 59.0, 89.0, 145.0, 250.0, 436.0, 792.0, 849.0, 544.0, 275.0, 169.0, 100.0, 79.0, 46.0, 34.0, 18.0, 16.0, 8.0, 8.0, 9.0, 2.0, 4.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.987762451171875, -1.91693115234375, -1.846099853515625, -1.7752685546875, -1.704437255859375, -1.63360595703125, -1.562774658203125, -1.491943359375, -1.421112060546875, -1.35028076171875, -1.279449462890625, -1.2086181640625, -1.137786865234375, -1.06695556640625, -0.996124267578125, -0.92529296875, -0.854461669921875, -0.78363037109375, -0.712799072265625, -0.6419677734375, -0.571136474609375, -0.50030517578125, -0.429473876953125, -0.358642578125, -0.287811279296875, -0.21697998046875, -0.146148681640625, -0.0753173828125, -0.004486083984375, 0.06634521484375, 0.137176513671875, 0.2080078125, 0.278839111328125, 0.34967041015625, 0.420501708984375, 0.4913330078125, 0.562164306640625, 0.63299560546875, 0.703826904296875, 0.774658203125, 0.845489501953125, 0.91632080078125, 0.987152099609375, 1.0579833984375, 1.128814697265625, 1.19964599609375, 1.270477294921875, 1.34130859375, 1.412139892578125, 1.48297119140625, 1.553802490234375, 1.6246337890625, 1.695465087890625, 1.76629638671875, 1.837127685546875, 1.907958984375, 1.978790283203125, 2.04962158203125, 2.120452880859375, 2.1912841796875, 2.262115478515625, 2.33294677734375, 2.403778076171875, 2.474609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 23.0, 34.0, 60.0, 84.0, 177.0, 193.0, 167.0, 119.0, 77.0, 26.0, 16.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.969508171081543, -5.497320652008057, -5.02513313293457, -4.552945137023926, -4.0807576179504395, -3.608570098876953, -3.1363823413848877, -2.6641945838928223, -2.192007064819336, -1.71981942653656, -1.2476317882537842, -0.7754441499710083, -0.3032565116882324, 0.1689310073852539, 0.6411187648773193, 1.1133065223693848, 1.585494041442871, 2.0576815605163574, 2.529869318008423, 3.0020570755004883, 3.4742445945739746, 3.946432113647461, 4.4186201095581055, 4.890807628631592, 5.362995147705078, 5.8351826667785645, 6.307370185852051, 6.779558181762695, 7.251745700836182, 7.723933219909668, 8.196121215820312, 8.66830825805664, 9.140495300292969, 9.612683296203613, 10.084870338439941, 10.557058334350586, 11.029245376586914, 11.501433372497559, 11.973621368408203, 12.445808410644531, 12.917996406555176, 13.39018440246582, 13.862371444702148, 14.334559440612793, 14.806747436523438, 15.278934478759766, 15.75112247467041, 16.223310470581055, 16.695497512817383, 17.16768455505371, 17.639873504638672, 18.112060546875, 18.584247589111328, 19.056434631347656, 19.528623580932617, 20.000810623168945, 20.472999572753906, 20.945186614990234, 21.417375564575195, 21.889562606811523, 22.36174964904785, 22.833938598632812, 23.30612564086914, 23.77831268310547, 24.250499725341797]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 10.0, 11.0, 10.0, 19.0, 24.0, 26.0, 38.0, 45.0, 40.0, 33.0, 61.0, 35.0, 70.0, 67.0, 53.0, 61.0, 55.0, 64.0, 48.0, 44.0, 41.0, 29.0, 24.0, 18.0, 20.0, 16.0, 8.0, 7.0, 10.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.938656806945801, -4.764148235321045, -4.589639663696289, -4.415131092071533, -4.240622520446777, -4.066113471984863, -3.8916049003601074, -3.7170963287353516, -3.5425877571105957, -3.36807918548584, -3.193570613861084, -3.019061803817749, -2.844553232192993, -2.6700446605682373, -2.4955358505249023, -2.3210272789001465, -2.1465187072753906, -1.9720101356506348, -1.7975014448165894, -1.622992753982544, -1.448484182357788, -1.2739756107330322, -1.0994669198989868, -0.9249582290649414, -0.7504496574401855, -0.5759410262107849, -0.4014323949813843, -0.22692376375198364, -0.05241513252258301, 0.12209349870681763, 0.29660212993621826, 0.47111082077026367, 0.6456198692321777, 0.8201285004615784, 0.994637131690979, 1.1691458225250244, 1.3436543941497803, 1.5181629657745361, 1.6926716566085815, 1.867180347442627, 2.041688919067383, 2.2161974906921387, 2.3907060623168945, 2.5652148723602295, 2.7397234439849854, 2.914232015609741, 3.088740825653076, 3.263249397277832, 3.437757968902588, 3.6122665405273438, 3.7867751121520996, 3.9612839221954346, 4.1357927322387695, 4.310301303863525, 4.484809875488281, 4.659318447113037, 4.833827018737793, 5.008335590362549, 5.182844161987305, 5.3573527336120605, 5.531861305236816, 5.7063703536987305, 5.880878925323486, 6.055387496948242, 6.229896068572998]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 8.0, 14.0, 20.0, 28.0, 38.0, 66.0, 121.0, 187.0, 345.0, 676.0, 1224.0, 2621.0, 6033.0, 15705.0, 50563.0, 213755.0, 502354.0, 185350.0, 44557.0, 14248.0, 5638.0, 2447.0, 1168.0, 582.0, 328.0, 161.0, 103.0, 69.0, 39.0, 39.0, 17.0, 12.0, 15.0, 7.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4781341552734375, -1.427947998046875, -1.3777618408203125, -1.32757568359375, -1.2773895263671875, -1.227203369140625, -1.1770172119140625, -1.1268310546875, -1.0766448974609375, -1.026458740234375, -0.9762725830078125, -0.92608642578125, -0.8759002685546875, -0.825714111328125, -0.7755279541015625, -0.725341796875, -0.6751556396484375, -0.624969482421875, -0.5747833251953125, -0.52459716796875, -0.4744110107421875, -0.424224853515625, -0.3740386962890625, -0.3238525390625, -0.2736663818359375, -0.223480224609375, -0.1732940673828125, -0.12310791015625, -0.0729217529296875, -0.022735595703125, 0.0274505615234375, 0.07763671875, 0.1278228759765625, 0.178009033203125, 0.2281951904296875, 0.27838134765625, 0.3285675048828125, 0.378753662109375, 0.4289398193359375, 0.4791259765625, 0.5293121337890625, 0.579498291015625, 0.6296844482421875, 0.67987060546875, 0.7300567626953125, 0.780242919921875, 0.8304290771484375, 0.880615234375, 0.9308013916015625, 0.980987548828125, 1.0311737060546875, 1.08135986328125, 1.1315460205078125, 1.181732177734375, 1.2319183349609375, 1.2821044921875, 1.3322906494140625, 1.382476806640625, 1.4326629638671875, 1.48284912109375, 1.5330352783203125, 1.583221435546875, 1.6334075927734375, 1.68359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 9.0, 19.0, 17.0, 28.0, 34.0, 44.0, 45.0, 41.0, 61.0, 87.0, 73.0, 76.0, 64.0, 87.0, 54.0, 54.0, 35.0, 41.0, 27.0, 34.0, 20.0, 15.0, 6.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.304779052734375, -3.17010498046875, -3.035430908203125, -2.9007568359375, -2.766082763671875, -2.63140869140625, -2.496734619140625, -2.362060546875, -2.227386474609375, -2.09271240234375, -1.958038330078125, -1.8233642578125, -1.688690185546875, -1.55401611328125, -1.419342041015625, -1.28466796875, -1.149993896484375, -1.01531982421875, -0.880645751953125, -0.7459716796875, -0.611297607421875, -0.47662353515625, -0.341949462890625, -0.207275390625, -0.072601318359375, 0.06207275390625, 0.196746826171875, 0.3314208984375, 0.466094970703125, 0.60076904296875, 0.735443115234375, 0.8701171875, 1.004791259765625, 1.13946533203125, 1.274139404296875, 1.4088134765625, 1.543487548828125, 1.67816162109375, 1.812835693359375, 1.947509765625, 2.082183837890625, 2.21685791015625, 2.351531982421875, 2.4862060546875, 2.620880126953125, 2.75555419921875, 2.890228271484375, 3.02490234375, 3.159576416015625, 3.29425048828125, 3.428924560546875, 3.5635986328125, 3.698272705078125, 3.83294677734375, 3.967620849609375, 4.102294921875, 4.236968994140625, 4.37164306640625, 4.506317138671875, 4.6409912109375, 4.775665283203125, 4.91033935546875, 5.045013427734375, 5.1796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 8.0, 8.0, 16.0, 24.0, 27.0, 50.0, 71.0, 153.0, 341.0, 696.0, 1866.0, 5506.0, 20801.0, 130774.0, 652388.0, 197260.0, 27712.0, 6939.0, 2217.0, 855.0, 369.0, 177.0, 105.0, 62.0, 27.0, 21.0, 20.0, 10.0, 11.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.05963134765625, -1.9923095703125, -1.92498779296875, -1.857666015625, -1.79034423828125, -1.7230224609375, -1.65570068359375, -1.58837890625, -1.52105712890625, -1.4537353515625, -1.38641357421875, -1.319091796875, -1.25177001953125, -1.1844482421875, -1.11712646484375, -1.0498046875, -0.98248291015625, -0.9151611328125, -0.84783935546875, -0.780517578125, -0.71319580078125, -0.6458740234375, -0.57855224609375, -0.51123046875, -0.44390869140625, -0.3765869140625, -0.30926513671875, -0.241943359375, -0.17462158203125, -0.1072998046875, -0.03997802734375, 0.02734375, 0.09466552734375, 0.1619873046875, 0.22930908203125, 0.296630859375, 0.36395263671875, 0.4312744140625, 0.49859619140625, 0.56591796875, 0.63323974609375, 0.7005615234375, 0.76788330078125, 0.835205078125, 0.90252685546875, 0.9698486328125, 1.03717041015625, 1.1044921875, 1.17181396484375, 1.2391357421875, 1.30645751953125, 1.373779296875, 1.44110107421875, 1.5084228515625, 1.57574462890625, 1.64306640625, 1.71038818359375, 1.7777099609375, 1.84503173828125, 1.912353515625, 1.97967529296875, 2.0469970703125, 2.11431884765625, 2.181640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 7.0, 7.0, 6.0, 9.0, 13.0, 14.0, 15.0, 28.0, 25.0, 28.0, 30.0, 39.0, 37.0, 41.0, 38.0, 45.0, 35.0, 44.0, 41.0, 43.0, 43.0, 39.0, 27.0, 48.0, 37.0, 30.0, 35.0, 30.0, 19.0, 21.0, 20.0, 15.0, 17.0, 18.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-5.25, -5.08636474609375, -4.9227294921875, -4.75909423828125, -4.595458984375, -4.43182373046875, -4.2681884765625, -4.10455322265625, -3.94091796875, -3.77728271484375, -3.6136474609375, -3.45001220703125, -3.286376953125, -3.12274169921875, -2.9591064453125, -2.79547119140625, -2.6318359375, -2.46820068359375, -2.3045654296875, -2.14093017578125, -1.977294921875, -1.81365966796875, -1.6500244140625, -1.48638916015625, -1.32275390625, -1.15911865234375, -0.9954833984375, -0.83184814453125, -0.668212890625, -0.50457763671875, -0.3409423828125, -0.17730712890625, -0.013671875, 0.14996337890625, 0.3135986328125, 0.47723388671875, 0.640869140625, 0.80450439453125, 0.9681396484375, 1.13177490234375, 1.29541015625, 1.45904541015625, 1.6226806640625, 1.78631591796875, 1.949951171875, 2.11358642578125, 2.2772216796875, 2.44085693359375, 2.6044921875, 2.76812744140625, 2.9317626953125, 3.09539794921875, 3.259033203125, 3.42266845703125, 3.5863037109375, 3.74993896484375, 3.91357421875, 4.07720947265625, 4.2408447265625, 4.40447998046875, 4.568115234375, 4.73175048828125, 4.8953857421875, 5.05902099609375, 5.22265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 8.0, 7.0, 15.0, 13.0, 16.0, 18.0, 38.0, 72.0, 113.0, 223.0, 397.0, 796.0, 1691.0, 4230.0, 12216.0, 56211.0, 433256.0, 458150.0, 60073.0, 12889.0, 4432.0, 1847.0, 862.0, 418.0, 209.0, 142.0, 69.0, 37.0, 39.0, 18.0, 11.0, 13.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8984375, -0.8703765869140625, -0.842315673828125, -0.8142547607421875, -0.78619384765625, -0.7581329345703125, -0.730072021484375, -0.7020111083984375, -0.6739501953125, -0.6458892822265625, -0.617828369140625, -0.5897674560546875, -0.56170654296875, -0.5336456298828125, -0.505584716796875, -0.4775238037109375, -0.449462890625, -0.4214019775390625, -0.393341064453125, -0.3652801513671875, -0.33721923828125, -0.3091583251953125, -0.281097412109375, -0.2530364990234375, -0.2249755859375, -0.1969146728515625, -0.168853759765625, -0.1407928466796875, -0.11273193359375, -0.0846710205078125, -0.056610107421875, -0.0285491943359375, -0.00048828125, 0.0275726318359375, 0.055633544921875, 0.0836944580078125, 0.11175537109375, 0.1398162841796875, 0.167877197265625, 0.1959381103515625, 0.2239990234375, 0.2520599365234375, 0.280120849609375, 0.3081817626953125, 0.33624267578125, 0.3643035888671875, 0.392364501953125, 0.4204254150390625, 0.448486328125, 0.4765472412109375, 0.504608154296875, 0.5326690673828125, 0.56072998046875, 0.5887908935546875, 0.616851806640625, 0.6449127197265625, 0.6729736328125, 0.7010345458984375, 0.729095458984375, 0.7571563720703125, 0.78521728515625, 0.8132781982421875, 0.841339111328125, 0.8694000244140625, 0.8974609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 8.0, 17.0, 18.0, 30.0, 47.0, 47.0, 101.0, 121.0, 129.0, 126.0, 105.0, 58.0, 48.0, 32.0, 18.0, 14.0, 14.0, 11.0, 3.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004360675811767578, -0.0004231072962284088, -0.0004101470112800598, -0.0003971867263317108, -0.0003842264413833618, -0.0003712661564350128, -0.0003583058714866638, -0.0003453455865383148, -0.0003323853015899658, -0.0003194250166416168, -0.0003064647316932678, -0.0002935044467449188, -0.0002805441617965698, -0.0002675838768482208, -0.0002546235918998718, -0.00024166330695152283, -0.00022870302200317383, -0.00021574273705482483, -0.00020278245210647583, -0.00018982216715812683, -0.00017686188220977783, -0.00016390159726142883, -0.00015094131231307983, -0.00013798102736473083, -0.00012502074241638184, -0.00011206045746803284, -9.910017251968384e-05, -8.613988757133484e-05, -7.317960262298584e-05, -6.021931767463684e-05, -4.725903272628784e-05, -3.429874777793884e-05, -2.1338462829589844e-05, -8.378177881240845e-06, 4.582107067108154e-06, 1.7542392015457153e-05, 3.0502676963806152e-05, 4.346296191215515e-05, 5.642324686050415e-05, 6.938353180885315e-05, 8.234381675720215e-05, 9.530410170555115e-05, 0.00010826438665390015, 0.00012122467160224915, 0.00013418495655059814, 0.00014714524149894714, 0.00016010552644729614, 0.00017306581139564514, 0.00018602609634399414, 0.00019898638129234314, 0.00021194666624069214, 0.00022490695118904114, 0.00023786723613739014, 0.00025082752108573914, 0.00026378780603408813, 0.00027674809098243713, 0.00028970837593078613, 0.00030266866087913513, 0.00031562894582748413, 0.00032858923077583313, 0.00034154951572418213, 0.00035450980067253113, 0.0003674700856208801, 0.0003804303705692291, 0.0003933906555175781]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 10.0, 6.0, 13.0, 20.0, 30.0, 29.0, 52.0, 79.0, 108.0, 192.0, 301.0, 568.0, 830.0, 1529.0, 2950.0, 5742.0, 12144.0, 29917.0, 82931.0, 262694.0, 397856.0, 160376.0, 52044.0, 19996.0, 8685.0, 4203.0, 2172.0, 1204.0, 673.0, 430.0, 266.0, 159.0, 105.0, 66.0, 61.0, 34.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.60205078125, -0.5854568481445312, -0.5688629150390625, -0.5522689819335938, -0.535675048828125, -0.5190811157226562, -0.5024871826171875, -0.48589324951171875, -0.46929931640625, -0.45270538330078125, -0.4361114501953125, -0.41951751708984375, -0.402923583984375, -0.38632965087890625, -0.3697357177734375, -0.35314178466796875, -0.3365478515625, -0.31995391845703125, -0.3033599853515625, -0.28676605224609375, -0.270172119140625, -0.25357818603515625, -0.2369842529296875, -0.22039031982421875, -0.20379638671875, -0.18720245361328125, -0.1706085205078125, -0.15401458740234375, -0.137420654296875, -0.12082672119140625, -0.1042327880859375, -0.08763885498046875, -0.071044921875, -0.05445098876953125, -0.0378570556640625, -0.02126312255859375, -0.004669189453125, 0.01192474365234375, 0.0285186767578125, 0.04511260986328125, 0.06170654296875, 0.07830047607421875, 0.0948944091796875, 0.11148834228515625, 0.128082275390625, 0.14467620849609375, 0.1612701416015625, 0.17786407470703125, 0.1944580078125, 0.21105194091796875, 0.2276458740234375, 0.24423980712890625, 0.260833740234375, 0.27742767333984375, 0.2940216064453125, 0.31061553955078125, 0.32720947265625, 0.34380340576171875, 0.3603973388671875, 0.37699127197265625, 0.393585205078125, 0.41017913818359375, 0.4267730712890625, 0.44336700439453125, 0.4599609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 9.0, 8.0, 9.0, 6.0, 9.0, 16.0, 9.0, 22.0, 26.0, 43.0, 38.0, 40.0, 67.0, 63.0, 57.0, 80.0, 71.0, 78.0, 70.0, 44.0, 48.0, 32.0, 34.0, 16.0, 15.0, 14.0, 12.0, 8.0, 9.0, 8.0, 7.0, 6.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14018630981445312, -0.13498687744140625, -0.12978744506835938, -0.1245880126953125, -0.11938858032226562, -0.11418914794921875, -0.10898971557617188, -0.103790283203125, -0.09859085083007812, -0.09339141845703125, -0.08819198608398438, -0.0829925537109375, -0.07779312133789062, -0.07259368896484375, -0.06739425659179688, -0.06219482421875, -0.056995391845703125, -0.05179595947265625, -0.046596527099609375, -0.0413970947265625, -0.036197662353515625, -0.03099822998046875, -0.025798797607421875, -0.020599365234375, -0.015399932861328125, -0.01020050048828125, -0.005001068115234375, 0.0001983642578125, 0.005397796630859375, 0.01059722900390625, 0.015796661376953125, 0.02099609375, 0.026195526123046875, 0.03139495849609375, 0.036594390869140625, 0.0417938232421875, 0.046993255615234375, 0.05219268798828125, 0.057392120361328125, 0.062591552734375, 0.06779098510742188, 0.07299041748046875, 0.07818984985351562, 0.0833892822265625, 0.08858871459960938, 0.09378814697265625, 0.09898757934570312, 0.10418701171875, 0.10938644409179688, 0.11458587646484375, 0.11978530883789062, 0.1249847412109375, 0.13018417358398438, 0.13538360595703125, 0.14058303833007812, 0.145782470703125, 0.15098190307617188, 0.15618133544921875, 0.16138076782226562, 0.1665802001953125, 0.17177963256835938, 0.17697906494140625, 0.18217849731445312, 0.1873779296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 23.0, 54.0, 111.0, 244.0, 275.0, 172.0, 68.0, 30.0, 12.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.353297233581543, -7.940892696380615, -7.528488636016846, -7.116084098815918, -6.703680038452148, -6.291275501251221, -5.878870964050293, -5.466466903686523, -5.054062366485596, -4.641657829284668, -4.229253768920898, -3.8168492317199707, -3.404444932937622, -2.9920406341552734, -2.5796360969543457, -2.167231798171997, -1.7548274993896484, -1.3424232006072998, -0.9300187826156616, -0.5176143646240234, -0.1052100658416748, 0.30719423294067383, 0.7195987701416016, 1.1320030689239502, 1.5444073677062988, 1.9568116664886475, 2.369215965270996, 2.781620502471924, 3.1940248012542725, 3.606429100036621, 4.018833637237549, 4.431238174438477, 4.8436431884765625, 5.25604772567749, 5.66845178604126, 6.0808563232421875, 6.493260383605957, 6.905664920806885, 7.3180694580078125, 7.730473518371582, 8.142877578735352, 8.555281639099121, 8.967686653137207, 9.380090713500977, 9.792494773864746, 10.204898834228516, 10.617303848266602, 11.029707908630371, 11.442112922668457, 11.854516983032227, 12.266921997070312, 12.679326057434082, 13.091730117797852, 13.504135131835938, 13.916539192199707, 14.328943252563477, 14.741348266601562, 15.153752326965332, 15.566157341003418, 15.978561401367188, 16.390966415405273, 16.803369522094727, 17.215774536132812, 17.6281795501709, 18.04058265686035]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 3.0, 9.0, 12.0, 19.0, 17.0, 24.0, 39.0, 36.0, 37.0, 51.0, 43.0, 60.0, 70.0, 68.0, 59.0, 66.0, 63.0, 73.0, 50.0, 42.0, 34.0, 30.0, 26.0, 21.0, 11.0, 6.0, 15.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431551694869995, -3.312861919403076, -3.194171905517578, -3.075482130050659, -2.9567923545837402, -2.838102340698242, -2.7194125652313232, -2.6007227897644043, -2.4820327758789062, -2.3633430004119873, -2.2446529865264893, -2.1259632110595703, -2.0072734355926514, -1.8885835409164429, -1.7698936462402344, -1.6512038707733154, -1.5325140953063965, -1.413824200630188, -1.295134425163269, -1.1764445304870605, -1.0577547550201416, -0.9390648603439331, -0.8203749656677246, -0.7016851305961609, -0.5829952955245972, -0.46430546045303345, -0.34561559557914734, -0.22692573070526123, -0.10823589563369751, 0.010453939437866211, 0.1291438341140747, 0.24783366918563843, 0.36652374267578125, 0.48521357774734497, 0.6039034128189087, 0.7225933074951172, 0.8412831425666809, 0.9599729776382446, 1.0786628723144531, 1.197352647781372, 1.3160425424575806, 1.434732437133789, 1.553422212600708, 1.6721121072769165, 1.790802001953125, 1.909491777420044, 2.028181552886963, 2.146871566772461, 2.26556134223938, 2.384251117706299, 2.502941131591797, 2.621630907058716, 2.7403206825256348, 2.859010696411133, 2.9777004718780518, 3.0963902473449707, 3.2150802612304688, 3.3337700366973877, 3.4524600505828857, 3.5711498260498047, 3.6898396015167236, 3.8085293769836426, 3.9272193908691406, 4.045909404754639, 4.1645989418029785]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 18.0, 32.0, 59.0, 84.0, 201.0, 384.0, 873.0, 2041.0, 5869.0, 21124.0, 139934.0, 774280.0, 80834.0, 15236.0, 4493.0, 1714.0, 714.0, 313.0, 153.0, 74.0, 52.0, 19.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.309326171875, -4.14599609375, -3.982666015625, -3.8193359375, -3.656005859375, -3.49267578125, -3.329345703125, -3.166015625, -3.002685546875, -2.83935546875, -2.676025390625, -2.5126953125, -2.349365234375, -2.18603515625, -2.022705078125, -1.859375, -1.696044921875, -1.53271484375, -1.369384765625, -1.2060546875, -1.042724609375, -0.87939453125, -0.716064453125, -0.552734375, -0.389404296875, -0.22607421875, -0.062744140625, 0.1005859375, 0.263916015625, 0.42724609375, 0.590576171875, 0.75390625, 0.917236328125, 1.08056640625, 1.243896484375, 1.4072265625, 1.570556640625, 1.73388671875, 1.897216796875, 2.060546875, 2.223876953125, 2.38720703125, 2.550537109375, 2.7138671875, 2.877197265625, 3.04052734375, 3.203857421875, 3.3671875, 3.530517578125, 3.69384765625, 3.857177734375, 4.0205078125, 4.183837890625, 4.34716796875, 4.510498046875, 4.673828125, 4.837158203125, 5.00048828125, 5.163818359375, 5.3271484375, 5.490478515625, 5.65380859375, 5.817138671875, 5.98046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 4.0, 12.0, 17.0, 15.0, 18.0, 36.0, 38.0, 37.0, 39.0, 45.0, 63.0, 70.0, 68.0, 63.0, 61.0, 61.0, 67.0, 58.0, 49.0, 37.0, 32.0, 24.0, 25.0, 14.0, 9.0, 10.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.2071533203125, -6.961181640625, -6.7152099609375, -6.46923828125, -6.2232666015625, -5.977294921875, -5.7313232421875, -5.4853515625, -5.2393798828125, -4.993408203125, -4.7474365234375, -4.50146484375, -4.2554931640625, -4.009521484375, -3.7635498046875, -3.517578125, -3.2716064453125, -3.025634765625, -2.7796630859375, -2.53369140625, -2.2877197265625, -2.041748046875, -1.7957763671875, -1.5498046875, -1.3038330078125, -1.057861328125, -0.8118896484375, -0.56591796875, -0.3199462890625, -0.073974609375, 0.1719970703125, 0.41796875, 0.6639404296875, 0.909912109375, 1.1558837890625, 1.40185546875, 1.6478271484375, 1.893798828125, 2.1397705078125, 2.3857421875, 2.6317138671875, 2.877685546875, 3.1236572265625, 3.36962890625, 3.6156005859375, 3.861572265625, 4.1075439453125, 4.353515625, 4.5994873046875, 4.845458984375, 5.0914306640625, 5.33740234375, 5.5833740234375, 5.829345703125, 6.0753173828125, 6.3212890625, 6.5672607421875, 6.813232421875, 7.0592041015625, 7.30517578125, 7.5511474609375, 7.797119140625, 8.0430908203125, 8.2890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 14.0, 10.0, 17.0, 22.0, 14.0, 15.0, 25.0, 36.0, 62.0, 75.0, 94.0, 211.0, 1007.0, 14149.0, 944753.0, 84540.0, 2729.0, 357.0, 118.0, 59.0, 53.0, 41.0, 22.0, 26.0, 18.0, 14.0, 12.0, 12.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1519775390625, -11.780517578125, -11.4090576171875, -11.03759765625, -10.6661376953125, -10.294677734375, -9.9232177734375, -9.5517578125, -9.1802978515625, -8.808837890625, -8.4373779296875, -8.06591796875, -7.6944580078125, -7.322998046875, -6.9515380859375, -6.580078125, -6.2086181640625, -5.837158203125, -5.4656982421875, -5.09423828125, -4.7227783203125, -4.351318359375, -3.9798583984375, -3.6083984375, -3.2369384765625, -2.865478515625, -2.4940185546875, -2.12255859375, -1.7510986328125, -1.379638671875, -1.0081787109375, -0.63671875, -0.2652587890625, 0.106201171875, 0.4776611328125, 0.84912109375, 1.2205810546875, 1.592041015625, 1.9635009765625, 2.3349609375, 2.7064208984375, 3.077880859375, 3.4493408203125, 3.82080078125, 4.1922607421875, 4.563720703125, 4.9351806640625, 5.306640625, 5.6781005859375, 6.049560546875, 6.4210205078125, 6.79248046875, 7.1639404296875, 7.535400390625, 7.9068603515625, 8.2783203125, 8.6497802734375, 9.021240234375, 9.3927001953125, 9.76416015625, 10.1356201171875, 10.507080078125, 10.8785400390625, 11.25]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 6.0, 21.0, 14.0, 21.0, 19.0, 23.0, 28.0, 42.0, 41.0, 63.0, 69.0, 57.0, 57.0, 68.0, 56.0, 54.0, 46.0, 52.0, 48.0, 46.0, 34.0, 23.0, 24.0, 14.0, 11.0, 15.0, 7.0, 7.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4765625, -11.1708984375, -10.865234375, -10.5595703125, -10.25390625, -9.9482421875, -9.642578125, -9.3369140625, -9.03125, -8.7255859375, -8.419921875, -8.1142578125, -7.80859375, -7.5029296875, -7.197265625, -6.8916015625, -6.5859375, -6.2802734375, -5.974609375, -5.6689453125, -5.36328125, -5.0576171875, -4.751953125, -4.4462890625, -4.140625, -3.8349609375, -3.529296875, -3.2236328125, -2.91796875, -2.6123046875, -2.306640625, -2.0009765625, -1.6953125, -1.3896484375, -1.083984375, -0.7783203125, -0.47265625, -0.1669921875, 0.138671875, 0.4443359375, 0.75, 1.0556640625, 1.361328125, 1.6669921875, 1.97265625, 2.2783203125, 2.583984375, 2.8896484375, 3.1953125, 3.5009765625, 3.806640625, 4.1123046875, 4.41796875, 4.7236328125, 5.029296875, 5.3349609375, 5.640625, 5.9462890625, 6.251953125, 6.5576171875, 6.86328125, 7.1689453125, 7.474609375, 7.7802734375, 8.0859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 7.0, 14.0, 9.0, 23.0, 15.0, 39.0, 78.0, 118.0, 272.0, 636.0, 1613.0, 5837.0, 35926.0, 578901.0, 387689.0, 29707.0, 5147.0, 1418.0, 567.0, 226.0, 138.0, 67.0, 23.0, 33.0, 13.0, 6.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.497222900390625, -1.44366455078125, -1.390106201171875, -1.3365478515625, -1.282989501953125, -1.22943115234375, -1.175872802734375, -1.122314453125, -1.068756103515625, -1.01519775390625, -0.961639404296875, -0.9080810546875, -0.854522705078125, -0.80096435546875, -0.747406005859375, -0.69384765625, -0.640289306640625, -0.58673095703125, -0.533172607421875, -0.4796142578125, -0.426055908203125, -0.37249755859375, -0.318939208984375, -0.265380859375, -0.211822509765625, -0.15826416015625, -0.104705810546875, -0.0511474609375, 0.002410888671875, 0.05596923828125, 0.109527587890625, 0.1630859375, 0.216644287109375, 0.27020263671875, 0.323760986328125, 0.3773193359375, 0.430877685546875, 0.48443603515625, 0.537994384765625, 0.591552734375, 0.645111083984375, 0.69866943359375, 0.752227783203125, 0.8057861328125, 0.859344482421875, 0.91290283203125, 0.966461181640625, 1.02001953125, 1.073577880859375, 1.12713623046875, 1.180694580078125, 1.2342529296875, 1.287811279296875, 1.34136962890625, 1.394927978515625, 1.448486328125, 1.502044677734375, 1.55560302734375, 1.609161376953125, 1.6627197265625, 1.716278076171875, 1.76983642578125, 1.823394775390625, 1.876953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 1.0, 6.0, 8.0, 8.0, 11.0, 10.0, 19.0, 28.0, 35.0, 58.0, 69.0, 85.0, 113.0, 153.0, 97.0, 70.0, 62.0, 34.0, 29.0, 22.0, 24.0, 14.0, 4.0, 6.0, 5.0, 1.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001690387725830078, -0.00016345083713531494, -0.00015786290168762207, -0.0001522749662399292, -0.00014668703079223633, -0.00014109909534454346, -0.00013551115989685059, -0.00012992322444915771, -0.00012433528900146484, -0.00011874735355377197, -0.0001131594181060791, -0.00010757148265838623, -0.00010198354721069336, -9.639561176300049e-05, -9.080767631530762e-05, -8.521974086761475e-05, -7.963180541992188e-05, -7.4043869972229e-05, -6.845593452453613e-05, -6.286799907684326e-05, -5.728006362915039e-05, -5.169212818145752e-05, -4.610419273376465e-05, -4.051625728607178e-05, -3.4928321838378906e-05, -2.9340386390686035e-05, -2.3752450942993164e-05, -1.8164515495300293e-05, -1.2576580047607422e-05, -6.988644599914551e-06, -1.4007091522216797e-06, 4.187226295471191e-06, 9.775161743164062e-06, 1.5363097190856934e-05, 2.0951032638549805e-05, 2.6538968086242676e-05, 3.212690353393555e-05, 3.771483898162842e-05, 4.330277442932129e-05, 4.889070987701416e-05, 5.447864532470703e-05, 6.00665807723999e-05, 6.565451622009277e-05, 7.124245166778564e-05, 7.683038711547852e-05, 8.241832256317139e-05, 8.800625801086426e-05, 9.359419345855713e-05, 9.918212890625e-05, 0.00010477006435394287, 0.00011035799980163574, 0.00011594593524932861, 0.00012153387069702148, 0.00012712180614471436, 0.00013270974159240723, 0.0001382976770401001, 0.00014388561248779297, 0.00014947354793548584, 0.0001550614833831787, 0.00016064941883087158, 0.00016623735427856445, 0.00017182528972625732, 0.0001774132251739502, 0.00018300116062164307, 0.00018858909606933594]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 11.0, 8.0, 15.0, 18.0, 32.0, 41.0, 119.0, 200.0, 439.0, 917.0, 2277.0, 6734.0, 27668.0, 169963.0, 711719.0, 101295.0, 18737.0, 4976.0, 1826.0, 752.0, 373.0, 181.0, 111.0, 48.0, 31.0, 21.0, 9.0, 8.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7548828125, -1.7103118896484375, -1.665740966796875, -1.6211700439453125, -1.57659912109375, -1.5320281982421875, -1.487457275390625, -1.4428863525390625, -1.3983154296875, -1.3537445068359375, -1.309173583984375, -1.2646026611328125, -1.22003173828125, -1.1754608154296875, -1.130889892578125, -1.0863189697265625, -1.041748046875, -0.9971771240234375, -0.952606201171875, -0.9080352783203125, -0.86346435546875, -0.8188934326171875, -0.774322509765625, -0.7297515869140625, -0.6851806640625, -0.6406097412109375, -0.596038818359375, -0.5514678955078125, -0.50689697265625, -0.4623260498046875, -0.417755126953125, -0.3731842041015625, -0.32861328125, -0.2840423583984375, -0.239471435546875, -0.1949005126953125, -0.15032958984375, -0.1057586669921875, -0.061187744140625, -0.0166168212890625, 0.0279541015625, 0.0725250244140625, 0.117095947265625, 0.1616668701171875, 0.20623779296875, 0.2508087158203125, 0.295379638671875, 0.3399505615234375, 0.384521484375, 0.4290924072265625, 0.473663330078125, 0.5182342529296875, 0.56280517578125, 0.6073760986328125, 0.651947021484375, 0.6965179443359375, 0.7410888671875, 0.7856597900390625, 0.830230712890625, 0.8748016357421875, 0.91937255859375, 0.9639434814453125, 1.008514404296875, 1.0530853271484375, 1.09765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 1.0, 11.0, 9.0, 12.0, 15.0, 24.0, 22.0, 26.0, 41.0, 51.0, 73.0, 101.0, 147.0, 128.0, 76.0, 49.0, 50.0, 36.0, 24.0, 19.0, 7.0, 12.0, 10.0, 5.0, 7.0, 13.0, 6.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.466796875, -0.44869232177734375, -0.4305877685546875, -0.41248321533203125, -0.394378662109375, -0.37627410888671875, -0.3581695556640625, -0.34006500244140625, -0.32196044921875, -0.30385589599609375, -0.2857513427734375, -0.26764678955078125, -0.249542236328125, -0.23143768310546875, -0.2133331298828125, -0.19522857666015625, -0.1771240234375, -0.15901947021484375, -0.1409149169921875, -0.12281036376953125, -0.104705810546875, -0.08660125732421875, -0.0684967041015625, -0.05039215087890625, -0.03228759765625, -0.01418304443359375, 0.0039215087890625, 0.02202606201171875, 0.040130615234375, 0.05823516845703125, 0.0763397216796875, 0.09444427490234375, 0.112548828125, 0.13065338134765625, 0.1487579345703125, 0.16686248779296875, 0.184967041015625, 0.20307159423828125, 0.2211761474609375, 0.23928070068359375, 0.25738525390625, 0.27548980712890625, 0.2935943603515625, 0.31169891357421875, 0.329803466796875, 0.34790802001953125, 0.3660125732421875, 0.38411712646484375, 0.4022216796875, 0.42032623291015625, 0.4384307861328125, 0.45653533935546875, 0.474639892578125, 0.49274444580078125, 0.5108489990234375, 0.5289535522460938, 0.54705810546875, 0.5651626586914062, 0.5832672119140625, 0.6013717651367188, 0.619476318359375, 0.6375808715820312, 0.6556854248046875, 0.6737899780273438, 0.69189453125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 10.0, 13.0, 30.0, 65.0, 104.0, 166.0, 225.0, 162.0, 102.0, 64.0, 33.0, 14.0, 4.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.068559646606445, -7.428589820861816, -6.788619518280029, -6.148649215698242, -5.508679389953613, -4.868709564208984, -4.228739261627197, -3.58876895904541, -2.9487991333007812, -2.3088290691375732, -1.6688590049743652, -1.0288889408111572, -0.3889188766479492, 0.2510511875152588, 0.8910212516784668, 1.530991554260254, 2.170961380004883, 2.810931444168091, 3.450901508331299, 4.090871810913086, 4.730841636657715, 5.370811462402344, 6.010781764984131, 6.650752067565918, 7.290721893310547, 7.930691719055176, 8.570661544799805, 9.21063232421875, 9.850602149963379, 10.490571975708008, 11.130542755126953, 11.770512580871582, 12.410484313964844, 13.050454139709473, 13.690423965454102, 14.330394744873047, 14.970364570617676, 15.610334396362305, 16.25030517578125, 16.890274047851562, 17.530244827270508, 18.170215606689453, 18.810184478759766, 19.45015525817871, 20.090126037597656, 20.73009490966797, 21.370065689086914, 22.01003646850586, 22.650005340576172, 23.289976119995117, 23.92994499206543, 24.569915771484375, 25.209884643554688, 25.849855422973633, 26.489826202392578, 27.12979507446289, 27.769765853881836, 28.40973663330078, 29.049705505371094, 29.68967628479004, 30.329647064208984, 30.969615936279297, 31.609586715698242, 32.24955749511719, 32.8895263671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 5.0, 12.0, 11.0, 19.0, 13.0, 23.0, 29.0, 23.0, 15.0, 26.0, 29.0, 30.0, 31.0, 28.0, 41.0, 32.0, 34.0, 40.0, 35.0, 38.0, 43.0, 51.0, 25.0, 51.0, 27.0, 48.0, 35.0, 33.0, 16.0, 17.0, 23.0, 23.0, 15.0, 16.0, 8.0, 9.0, 8.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.097710609436035, -10.776701927185059, -10.455692291259766, -10.134683609008789, -9.813674926757812, -9.492666244506836, -9.171656608581543, -8.850647926330566, -8.52963924407959, -8.208630561828613, -7.8876214027404785, -7.566612243652344, -7.245603561401367, -6.924594402313232, -6.603585243225098, -6.282576560974121, -5.961567401885986, -5.640558242797852, -5.319549560546875, -4.99854040145874, -4.677531719207764, -4.356522560119629, -4.035513877868652, -3.7145047187805176, -3.393495798110962, -3.0724868774414062, -2.7514779567718506, -2.430469036102295, -2.10945987701416, -1.788451075553894, -1.4674420356750488, -1.1464331150054932, -0.8254241943359375, -0.5044152736663818, -0.1834062933921814, 0.13760268688201904, 0.4586116075515747, 0.7796205282211304, 1.1006295680999756, 1.4216384887695312, 1.742647409439087, 2.0636563301086426, 2.3846652507781982, 2.705674171447754, 3.0266833305358887, 3.3476920127868652, 3.668701171875, 3.9897100925445557, 4.310719013214111, 4.631728172302246, 4.952736854553223, 5.273746013641357, 5.594754695892334, 5.915763854980469, 6.236772537231445, 6.55778169631958, 6.878790855407715, 7.19980001449585, 7.520808696746826, 7.841817855834961, 8.162826538085938, 8.483835220336914, 8.804844856262207, 9.125853538513184, 9.44686222076416]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 0.0, 9.0, 12.0, 10.0, 7.0, 11.0, 28.0, 21.0, 52.0, 40.0, 79.0, 169.0, 327.0, 739.0, 2360.0, 9398.0, 68413.0, 3539895.0, 544538.0, 21809.0, 4085.0, 1244.0, 425.0, 200.0, 128.0, 61.0, 42.0, 35.0, 18.0, 19.0, 27.0, 15.0, 15.0, 13.0, 10.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1953125, -10.819091796875, -10.44287109375, -10.066650390625, -9.6904296875, -9.314208984375, -8.93798828125, -8.561767578125, -8.185546875, -7.809326171875, -7.43310546875, -7.056884765625, -6.6806640625, -6.304443359375, -5.92822265625, -5.552001953125, -5.17578125, -4.799560546875, -4.42333984375, -4.047119140625, -3.6708984375, -3.294677734375, -2.91845703125, -2.542236328125, -2.166015625, -1.789794921875, -1.41357421875, -1.037353515625, -0.6611328125, -0.284912109375, 0.09130859375, 0.467529296875, 0.84375, 1.219970703125, 1.59619140625, 1.972412109375, 2.3486328125, 2.724853515625, 3.10107421875, 3.477294921875, 3.853515625, 4.229736328125, 4.60595703125, 4.982177734375, 5.3583984375, 5.734619140625, 6.11083984375, 6.487060546875, 6.86328125, 7.239501953125, 7.61572265625, 7.991943359375, 8.3681640625, 8.744384765625, 9.12060546875, 9.496826171875, 9.873046875, 10.249267578125, 10.62548828125, 11.001708984375, 11.3779296875, 11.754150390625, 12.13037109375, 12.506591796875, 12.8828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 1.0, 7.0, 20.0, 20.0, 14.0, 35.0, 41.0, 49.0, 55.0, 89.0, 79.0, 94.0, 99.0, 68.0, 96.0, 57.0, 56.0, 34.0, 33.0, 22.0, 15.0, 11.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.17327880859375, -3.9910888671875, -3.80889892578125, -3.626708984375, -3.44451904296875, -3.2623291015625, -3.08013916015625, -2.89794921875, -2.71575927734375, -2.5335693359375, -2.35137939453125, -2.169189453125, -1.98699951171875, -1.8048095703125, -1.62261962890625, -1.4404296875, -1.25823974609375, -1.0760498046875, -0.89385986328125, -0.711669921875, -0.52947998046875, -0.3472900390625, -0.16510009765625, 0.01708984375, 0.19927978515625, 0.3814697265625, 0.56365966796875, 0.745849609375, 0.92803955078125, 1.1102294921875, 1.29241943359375, 1.474609375, 1.65679931640625, 1.8389892578125, 2.02117919921875, 2.203369140625, 2.38555908203125, 2.5677490234375, 2.74993896484375, 2.93212890625, 3.11431884765625, 3.2965087890625, 3.47869873046875, 3.660888671875, 3.84307861328125, 4.0252685546875, 4.20745849609375, 4.3896484375, 4.57183837890625, 4.7540283203125, 4.93621826171875, 5.118408203125, 5.30059814453125, 5.4827880859375, 5.66497802734375, 5.84716796875, 6.02935791015625, 6.2115478515625, 6.39373779296875, 6.575927734375, 6.75811767578125, 6.9403076171875, 7.12249755859375, 7.3046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 13.0, 10.0, 17.0, 18.0, 33.0, 44.0, 67.0, 168.0, 334.0, 852.0, 3478.0, 24247.0, 927796.0, 3187272.0, 42934.0, 5043.0, 1139.0, 383.0, 160.0, 87.0, 50.0, 35.0, 26.0, 15.0, 9.0, 10.0, 8.0, 6.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.2890625, -10.9375, -10.5859375, -10.234375, -9.8828125, -9.53125, -9.1796875, -8.828125, -8.4765625, -8.125, -7.7734375, -7.421875, -7.0703125, -6.71875, -6.3671875, -6.015625, -5.6640625, -5.3125, -4.9609375, -4.609375, -4.2578125, -3.90625, -3.5546875, -3.203125, -2.8515625, -2.5, -2.1484375, -1.796875, -1.4453125, -1.09375, -0.7421875, -0.390625, -0.0390625, 0.3125, 0.6640625, 1.015625, 1.3671875, 1.71875, 2.0703125, 2.421875, 2.7734375, 3.125, 3.4765625, 3.828125, 4.1796875, 4.53125, 4.8828125, 5.234375, 5.5859375, 5.9375, 6.2890625, 6.640625, 6.9921875, 7.34375, 7.6953125, 8.046875, 8.3984375, 8.75, 9.1015625, 9.453125, 9.8046875, 10.15625, 10.5078125, 10.859375, 11.2109375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 14.0, 17.0, 26.0, 34.0, 48.0, 55.0, 100.0, 170.0, 256.0, 470.0, 730.0, 822.0, 497.0, 295.0, 147.0, 115.0, 77.0, 49.0, 32.0, 24.0, 18.0, 8.0, 14.0, 11.0, 3.0, 1.0, 9.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.8108062744140625, -1.752471923828125, -1.6941375732421875, -1.63580322265625, -1.5774688720703125, -1.519134521484375, -1.4608001708984375, -1.4024658203125, -1.3441314697265625, -1.285797119140625, -1.2274627685546875, -1.16912841796875, -1.1107940673828125, -1.052459716796875, -0.9941253662109375, -0.935791015625, -0.8774566650390625, -0.819122314453125, -0.7607879638671875, -0.70245361328125, -0.6441192626953125, -0.585784912109375, -0.5274505615234375, -0.4691162109375, -0.4107818603515625, -0.352447509765625, -0.2941131591796875, -0.23577880859375, -0.1774444580078125, -0.119110107421875, -0.0607757568359375, -0.00244140625, 0.0558929443359375, 0.114227294921875, 0.1725616455078125, 0.23089599609375, 0.2892303466796875, 0.347564697265625, 0.4058990478515625, 0.4642333984375, 0.5225677490234375, 0.580902099609375, 0.6392364501953125, 0.69757080078125, 0.7559051513671875, 0.814239501953125, 0.8725738525390625, 0.930908203125, 0.9892425537109375, 1.047576904296875, 1.1059112548828125, 1.16424560546875, 1.2225799560546875, 1.280914306640625, 1.3392486572265625, 1.3975830078125, 1.4559173583984375, 1.514251708984375, 1.5725860595703125, 1.63092041015625, 1.6892547607421875, 1.747589111328125, 1.8059234619140625, 1.8642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 12.0, 31.0, 71.0, 152.0, 265.0, 213.0, 158.0, 59.0, 31.0, 14.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1069159507751465, -4.539866924285889, -3.972817897796631, -3.405768871307373, -2.8387198448181152, -2.2716708183288574, -1.7046217918395996, -1.1375727653503418, -0.570523738861084, -0.003474712371826172, 0.5635743141174316, 1.1306233406066895, 1.6976723670959473, 2.264721393585205, 2.831770420074463, 3.3988194465637207, 3.9658684730529785, 4.532917499542236, 5.099966526031494, 5.667015552520752, 6.23406457901001, 6.801113605499268, 7.368162631988525, 7.935211658477783, 8.502260208129883, 9.06930923461914, 9.636358261108398, 10.203407287597656, 10.770456314086914, 11.337505340576172, 11.90455436706543, 12.471603393554688, 13.038652420043945, 13.605701446533203, 14.172750473022461, 14.739799499511719, 15.306848526000977, 15.873897552490234, 16.440946578979492, 17.00799560546875, 17.575044631958008, 18.142093658447266, 18.709142684936523, 19.27619171142578, 19.84324073791504, 20.410289764404297, 20.977338790893555, 21.544387817382812, 22.11143684387207, 22.678485870361328, 23.245534896850586, 23.812583923339844, 24.3796329498291, 24.94668197631836, 25.513731002807617, 26.080780029296875, 26.647829055786133, 27.21487808227539, 27.78192710876465, 28.348976135253906, 28.916025161743164, 29.483074188232422, 30.05012321472168, 30.617172241210938, 31.184221267700195]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 11.0, 15.0, 15.0, 21.0, 31.0, 28.0, 33.0, 26.0, 44.0, 59.0, 67.0, 45.0, 61.0, 64.0, 64.0, 58.0, 57.0, 51.0, 45.0, 37.0, 34.0, 27.0, 25.0, 23.0, 17.0, 14.0, 11.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30944299697876, -4.143120288848877, -3.976797342300415, -3.810474395751953, -3.6441516876220703, -3.4778289794921875, -3.3115060329437256, -3.1451830863952637, -2.978860378265381, -2.812537670135498, -2.646214723587036, -2.479891777038574, -2.3135690689086914, -2.1472463607788086, -1.9809234142303467, -1.8146005868911743, -1.648277759552002, -1.4819549322128296, -1.3156321048736572, -1.1493092775344849, -0.9829864501953125, -0.8166636228561401, -0.6503407955169678, -0.4840179681777954, -0.31769514083862305, -0.15137231349945068, 0.01495051383972168, 0.18127334117889404, 0.3475961685180664, 0.5139189958572388, 0.6802418231964111, 0.8465646505355835, 1.012887954711914, 1.1792107820510864, 1.3455336093902588, 1.5118564367294312, 1.6781792640686035, 1.8445020914077759, 2.0108249187469482, 2.17714786529541, 2.343470573425293, 2.509793281555176, 2.6761162281036377, 2.8424391746520996, 3.0087618827819824, 3.1750845909118652, 3.341407537460327, 3.507730484008789, 3.674053192138672, 3.8403759002685547, 4.0066986083984375, 4.1730217933654785, 4.339344501495361, 4.505667209625244, 4.671990394592285, 4.838313102722168, 5.004635810852051, 5.170958518981934, 5.337281227111816, 5.503604412078857, 5.66992712020874, 5.836249828338623, 6.002573013305664, 6.168895721435547, 6.33521842956543]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 7.0, 16.0, 14.0, 17.0, 48.0, 51.0, 104.0, 145.0, 299.0, 552.0, 1125.0, 2336.0, 5536.0, 15172.0, 60381.0, 382348.0, 473440.0, 77392.0, 18279.0, 6091.0, 2599.0, 1248.0, 601.0, 315.0, 168.0, 91.0, 54.0, 39.0, 30.0, 14.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.73046875, -1.664093017578125, -1.59771728515625, -1.531341552734375, -1.4649658203125, -1.398590087890625, -1.33221435546875, -1.265838623046875, -1.199462890625, -1.133087158203125, -1.06671142578125, -1.000335693359375, -0.9339599609375, -0.867584228515625, -0.80120849609375, -0.734832763671875, -0.66845703125, -0.602081298828125, -0.53570556640625, -0.469329833984375, -0.4029541015625, -0.336578369140625, -0.27020263671875, -0.203826904296875, -0.137451171875, -0.071075439453125, -0.00469970703125, 0.061676025390625, 0.1280517578125, 0.194427490234375, 0.26080322265625, 0.327178955078125, 0.3935546875, 0.459930419921875, 0.52630615234375, 0.592681884765625, 0.6590576171875, 0.725433349609375, 0.79180908203125, 0.858184814453125, 0.924560546875, 0.990936279296875, 1.05731201171875, 1.123687744140625, 1.1900634765625, 1.256439208984375, 1.32281494140625, 1.389190673828125, 1.45556640625, 1.521942138671875, 1.58831787109375, 1.654693603515625, 1.7210693359375, 1.787445068359375, 1.85382080078125, 1.920196533203125, 1.986572265625, 2.052947998046875, 2.11932373046875, 2.185699462890625, 2.2520751953125, 2.318450927734375, 2.38482666015625, 2.451202392578125, 2.517578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 7.0, 11.0, 9.0, 27.0, 10.0, 29.0, 21.0, 27.0, 28.0, 36.0, 44.0, 38.0, 45.0, 42.0, 47.0, 49.0, 46.0, 53.0, 38.0, 53.0, 46.0, 37.0, 44.0, 26.0, 30.0, 26.0, 23.0, 24.0, 13.0, 12.0, 17.0, 10.0, 8.0, 3.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.74908447265625, -2.6563720703125, -2.56365966796875, -2.470947265625, -2.37823486328125, -2.2855224609375, -2.19281005859375, -2.10009765625, -2.00738525390625, -1.9146728515625, -1.82196044921875, -1.729248046875, -1.63653564453125, -1.5438232421875, -1.45111083984375, -1.3583984375, -1.26568603515625, -1.1729736328125, -1.08026123046875, -0.987548828125, -0.89483642578125, -0.8021240234375, -0.70941162109375, -0.61669921875, -0.52398681640625, -0.4312744140625, -0.33856201171875, -0.245849609375, -0.15313720703125, -0.0604248046875, 0.03228759765625, 0.125, 0.21771240234375, 0.3104248046875, 0.40313720703125, 0.495849609375, 0.58856201171875, 0.6812744140625, 0.77398681640625, 0.86669921875, 0.95941162109375, 1.0521240234375, 1.14483642578125, 1.237548828125, 1.33026123046875, 1.4229736328125, 1.51568603515625, 1.6083984375, 1.70111083984375, 1.7938232421875, 1.88653564453125, 1.979248046875, 2.07196044921875, 2.1646728515625, 2.25738525390625, 2.35009765625, 2.44281005859375, 2.5355224609375, 2.62823486328125, 2.720947265625, 2.81365966796875, 2.9063720703125, 2.99908447265625, 3.091796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 3.0, 14.0, 14.0, 12.0, 23.0, 25.0, 54.0, 86.0, 120.0, 256.0, 468.0, 1028.0, 2283.0, 6130.0, 19711.0, 92958.0, 525844.0, 325907.0, 53407.0, 12681.0, 4174.0, 1669.0, 778.0, 365.0, 206.0, 94.0, 68.0, 48.0, 35.0, 22.0, 19.0, 16.0, 7.0, 8.0, 2.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8447265625, -1.788543701171875, -1.73236083984375, -1.676177978515625, -1.6199951171875, -1.563812255859375, -1.50762939453125, -1.451446533203125, -1.395263671875, -1.339080810546875, -1.28289794921875, -1.226715087890625, -1.1705322265625, -1.114349365234375, -1.05816650390625, -1.001983642578125, -0.94580078125, -0.889617919921875, -0.83343505859375, -0.777252197265625, -0.7210693359375, -0.664886474609375, -0.60870361328125, -0.552520751953125, -0.496337890625, -0.440155029296875, -0.38397216796875, -0.327789306640625, -0.2716064453125, -0.215423583984375, -0.15924072265625, -0.103057861328125, -0.046875, 0.009307861328125, 0.06549072265625, 0.121673583984375, 0.1778564453125, 0.234039306640625, 0.29022216796875, 0.346405029296875, 0.402587890625, 0.458770751953125, 0.51495361328125, 0.571136474609375, 0.6273193359375, 0.683502197265625, 0.73968505859375, 0.795867919921875, 0.85205078125, 0.908233642578125, 0.96441650390625, 1.020599365234375, 1.0767822265625, 1.132965087890625, 1.18914794921875, 1.245330810546875, 1.301513671875, 1.357696533203125, 1.41387939453125, 1.470062255859375, 1.5262451171875, 1.582427978515625, 1.63861083984375, 1.694793701171875, 1.7509765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 1.0, 11.0, 11.0, 10.0, 17.0, 16.0, 16.0, 22.0, 20.0, 23.0, 23.0, 42.0, 35.0, 29.0, 43.0, 39.0, 40.0, 51.0, 47.0, 45.0, 43.0, 33.0, 36.0, 32.0, 27.0, 35.0, 36.0, 41.0, 29.0, 18.0, 22.0, 12.0, 15.0, 20.0, 13.0, 9.0, 5.0, 4.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.83203125, -5.65875244140625, -5.4854736328125, -5.31219482421875, -5.138916015625, -4.96563720703125, -4.7923583984375, -4.61907958984375, -4.44580078125, -4.27252197265625, -4.0992431640625, -3.92596435546875, -3.752685546875, -3.57940673828125, -3.4061279296875, -3.23284912109375, -3.0595703125, -2.88629150390625, -2.7130126953125, -2.53973388671875, -2.366455078125, -2.19317626953125, -2.0198974609375, -1.84661865234375, -1.67333984375, -1.50006103515625, -1.3267822265625, -1.15350341796875, -0.980224609375, -0.80694580078125, -0.6336669921875, -0.46038818359375, -0.287109375, -0.11383056640625, 0.0594482421875, 0.23272705078125, 0.406005859375, 0.57928466796875, 0.7525634765625, 0.92584228515625, 1.09912109375, 1.27239990234375, 1.4456787109375, 1.61895751953125, 1.792236328125, 1.96551513671875, 2.1387939453125, 2.31207275390625, 2.4853515625, 2.65863037109375, 2.8319091796875, 3.00518798828125, 3.178466796875, 3.35174560546875, 3.5250244140625, 3.69830322265625, 3.87158203125, 4.04486083984375, 4.2181396484375, 4.39141845703125, 4.564697265625, 4.73797607421875, 4.9112548828125, 5.08453369140625, 5.2578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 16.0, 15.0, 23.0, 32.0, 56.0, 84.0, 133.0, 222.0, 421.0, 722.0, 1475.0, 3831.0, 12283.0, 78021.0, 712814.0, 207021.0, 21939.0, 5477.0, 2002.0, 863.0, 437.0, 264.0, 127.0, 82.0, 45.0, 40.0, 16.0, 23.0, 14.0, 3.0, 5.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8184585571289062, -0.7877960205078125, -0.7571334838867188, -0.726470947265625, -0.6958084106445312, -0.6651458740234375, -0.6344833374023438, -0.60382080078125, -0.5731582641601562, -0.5424957275390625, -0.5118331909179688, -0.481170654296875, -0.45050811767578125, -0.4198455810546875, -0.38918304443359375, -0.3585205078125, -0.32785797119140625, -0.2971954345703125, -0.26653289794921875, -0.235870361328125, -0.20520782470703125, -0.1745452880859375, -0.14388275146484375, -0.11322021484375, -0.08255767822265625, -0.0518951416015625, -0.02123260498046875, 0.009429931640625, 0.04009246826171875, 0.0707550048828125, 0.10141754150390625, 0.132080078125, 0.16274261474609375, 0.1934051513671875, 0.22406768798828125, 0.254730224609375, 0.28539276123046875, 0.3160552978515625, 0.34671783447265625, 0.37738037109375, 0.40804290771484375, 0.4387054443359375, 0.46936798095703125, 0.500030517578125, 0.5306930541992188, 0.5613555908203125, 0.5920181274414062, 0.6226806640625, 0.6533432006835938, 0.6840057373046875, 0.7146682739257812, 0.745330810546875, 0.7759933471679688, 0.8066558837890625, 0.8373184204101562, 0.86798095703125, 0.8986434936523438, 0.9293060302734375, 0.9599685668945312, 0.990631103515625, 1.0212936401367188, 1.0519561767578125, 1.0826187133789062, 1.11328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 5.0, 8.0, 16.0, 19.0, 29.0, 54.0, 50.0, 116.0, 159.0, 157.0, 135.0, 78.0, 56.0, 39.0, 22.0, 13.0, 14.0, 6.0, 4.0, 8.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004048347473144531, -0.00039149075746536255, -0.00037814676761627197, -0.0003648027777671814, -0.0003514587879180908, -0.00033811479806900024, -0.00032477080821990967, -0.0003114268183708191, -0.0002980828285217285, -0.00028473883867263794, -0.00027139484882354736, -0.0002580508589744568, -0.0002447068691253662, -0.00023136287927627563, -0.00021801888942718506, -0.00020467489957809448, -0.0001913309097290039, -0.00017798691987991333, -0.00016464293003082275, -0.00015129894018173218, -0.0001379549503326416, -0.00012461096048355103, -0.00011126697063446045, -9.792298078536987e-05, -8.45789909362793e-05, -7.123500108718872e-05, -5.7891011238098145e-05, -4.454702138900757e-05, -3.120303153991699e-05, -1.7859041690826416e-05, -4.51505184173584e-06, 8.828938007354736e-06, 2.2172927856445312e-05, 3.551691770553589e-05, 4.8860907554626465e-05, 6.220489740371704e-05, 7.554888725280762e-05, 8.88928771018982e-05, 0.00010223686695098877, 0.00011558085680007935, 0.00012892484664916992, 0.0001422688364982605, 0.00015561282634735107, 0.00016895681619644165, 0.00018230080604553223, 0.0001956447958946228, 0.00020898878574371338, 0.00022233277559280396, 0.00023567676544189453, 0.0002490207552909851, 0.0002623647451400757, 0.00027570873498916626, 0.00028905272483825684, 0.0003023967146873474, 0.000315740704536438, 0.00032908469438552856, 0.00034242868423461914, 0.0003557726740837097, 0.0003691166639328003, 0.00038246065378189087, 0.00039580464363098145, 0.000409148633480072, 0.0004224926233291626, 0.0004358366131782532, 0.00044918060302734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 4.0, 5.0, 13.0, 20.0, 28.0, 63.0, 72.0, 126.0, 221.0, 416.0, 873.0, 1783.0, 4962.0, 19568.0, 205694.0, 738420.0, 60793.0, 9824.0, 3003.0, 1261.0, 610.0, 311.0, 194.0, 99.0, 66.0, 29.0, 31.0, 17.0, 8.0, 4.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.3472137451171875, -1.306732177734375, -1.2662506103515625, -1.22576904296875, -1.1852874755859375, -1.144805908203125, -1.1043243408203125, -1.0638427734375, -1.0233612060546875, -0.982879638671875, -0.9423980712890625, -0.90191650390625, -0.8614349365234375, -0.820953369140625, -0.7804718017578125, -0.739990234375, -0.6995086669921875, -0.659027099609375, -0.6185455322265625, -0.57806396484375, -0.5375823974609375, -0.497100830078125, -0.4566192626953125, -0.4161376953125, -0.3756561279296875, -0.335174560546875, -0.2946929931640625, -0.25421142578125, -0.2137298583984375, -0.173248291015625, -0.1327667236328125, -0.09228515625, -0.0518035888671875, -0.011322021484375, 0.0291595458984375, 0.06964111328125, 0.1101226806640625, 0.150604248046875, 0.1910858154296875, 0.2315673828125, 0.2720489501953125, 0.312530517578125, 0.3530120849609375, 0.39349365234375, 0.4339752197265625, 0.474456787109375, 0.5149383544921875, 0.555419921875, 0.5959014892578125, 0.636383056640625, 0.6768646240234375, 0.71734619140625, 0.7578277587890625, 0.798309326171875, 0.8387908935546875, 0.8792724609375, 0.9197540283203125, 0.960235595703125, 1.0007171630859375, 1.04119873046875, 1.0816802978515625, 1.122161865234375, 1.1626434326171875, 1.203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 4.0, 12.0, 7.0, 15.0, 23.0, 26.0, 47.0, 74.0, 79.0, 152.0, 161.0, 125.0, 72.0, 54.0, 51.0, 23.0, 8.0, 16.0, 10.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358642578125, -0.3481559753417969, -0.33766937255859375, -0.3271827697753906, -0.3166961669921875, -0.3062095642089844, -0.29572296142578125, -0.2852363586425781, -0.274749755859375, -0.2642631530761719, -0.25377655029296875, -0.24328994750976562, -0.2328033447265625, -0.22231674194335938, -0.21183013916015625, -0.20134353637695312, -0.19085693359375, -0.18037033081054688, -0.16988372802734375, -0.15939712524414062, -0.1489105224609375, -0.13842391967773438, -0.12793731689453125, -0.11745071411132812, -0.106964111328125, -0.09647750854492188, -0.08599090576171875, -0.07550430297851562, -0.0650177001953125, -0.054531097412109375, -0.04404449462890625, -0.033557891845703125, -0.0230712890625, -0.012584686279296875, -0.00209808349609375, 0.008388519287109375, 0.0188751220703125, 0.029361724853515625, 0.03984832763671875, 0.050334930419921875, 0.060821533203125, 0.07130813598632812, 0.08179473876953125, 0.09228134155273438, 0.1027679443359375, 0.11325454711914062, 0.12374114990234375, 0.13422775268554688, 0.14471435546875, 0.15520095825195312, 0.16568756103515625, 0.17617416381835938, 0.1866607666015625, 0.19714736938476562, 0.20763397216796875, 0.21812057495117188, 0.228607177734375, 0.23909378051757812, 0.24958038330078125, 0.2600669860839844, 0.2705535888671875, 0.2810401916503906, 0.29152679443359375, 0.3020133972167969, 0.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 10.0, 19.0, 37.0, 78.0, 118.0, 207.0, 183.0, 148.0, 97.0, 51.0, 35.0, 13.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6614701747894287, -3.362987995147705, -3.0645058155059814, -2.766023635864258, -2.4675416946411133, -2.1690592765808105, -1.870577335357666, -1.5720951557159424, -1.2736129760742188, -0.9751307964324951, -0.6766486763954163, -0.3781665563583374, -0.07968437671661377, 0.21879780292510986, 0.517279863357544, 0.8157620429992676, 1.1142442226409912, 1.4127264022827148, 1.7112085819244385, 2.009690761566162, 2.3081727027893066, 2.6066551208496094, 2.905137062072754, 3.2036192417144775, 3.502101421356201, 3.800583600997925, 4.099065780639648, 4.397547721862793, 4.696030139923096, 4.99451208114624, 5.292994499206543, 5.5914764404296875, 5.889959335327148, 6.188441276550293, 6.486923694610596, 6.78540563583374, 7.083888053894043, 7.3823699951171875, 7.680851936340332, 7.979334354400635, 8.277816772460938, 8.576298713684082, 8.874780654907227, 9.173263549804688, 9.471745491027832, 9.770227432250977, 10.068709373474121, 10.367191314697266, 10.665674209594727, 10.964156150817871, 11.262638092041016, 11.561120986938477, 11.859602928161621, 12.158084869384766, 12.45656681060791, 12.755048751831055, 13.0535306930542, 13.352012634277344, 13.650494575500488, 13.94897747039795, 14.247459411621094, 14.545941352844238, 14.844423294067383, 15.142906188964844, 15.441388130187988]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 8.0, 10.0, 10.0, 16.0, 27.0, 31.0, 21.0, 33.0, 44.0, 39.0, 53.0, 60.0, 63.0, 58.0, 64.0, 61.0, 54.0, 40.0, 51.0, 40.0, 49.0, 43.0, 31.0, 19.0, 19.0, 17.0, 9.0, 7.0, 6.0, 9.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.212761878967285, -3.0995283126831055, -2.986294746398926, -2.873061180114746, -2.7598276138305664, -2.6465940475463867, -2.533360481262207, -2.4201269149780273, -2.3068933486938477, -2.193659782409668, -2.0804262161254883, -1.9671926498413086, -1.853959083557129, -1.7407255172729492, -1.6274919509887695, -1.5142583847045898, -1.4010248184204102, -1.2877912521362305, -1.1745576858520508, -1.061324119567871, -0.9480905532836914, -0.8348569869995117, -0.721623420715332, -0.6083898544311523, -0.49515628814697266, -0.38192272186279297, -0.2686891555786133, -0.1554555892944336, -0.042222023010253906, 0.07101154327392578, 0.18424510955810547, 0.29747867584228516, 0.41071224212646484, 0.5239458084106445, 0.6371793746948242, 0.7504129409790039, 0.8636465072631836, 0.9768800735473633, 1.090113639831543, 1.2033472061157227, 1.3165807723999023, 1.429814338684082, 1.5430479049682617, 1.6562814712524414, 1.769515037536621, 1.8827486038208008, 1.9959821701049805, 2.10921573638916, 2.22244930267334, 2.3356828689575195, 2.448916435241699, 2.562150001525879, 2.6753835678100586, 2.7886171340942383, 2.901850700378418, 3.0150842666625977, 3.1283178329467773, 3.241551399230957, 3.3547849655151367, 3.4680185317993164, 3.581252098083496, 3.694485664367676, 3.8077192306518555, 3.920952796936035, 4.034186363220215]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 14.0, 16.0, 25.0, 50.0, 57.0, 118.0, 176.0, 326.0, 548.0, 972.0, 2039.0, 4121.0, 9805.0, 27851.0, 107261.0, 630072.0, 198398.0, 41998.0, 13746.0, 5504.0, 2586.0, 1276.0, 673.0, 376.0, 190.0, 117.0, 90.0, 45.0, 31.0, 26.0, 13.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.140289306640625, -3.01300048828125, -2.885711669921875, -2.7584228515625, -2.631134033203125, -2.50384521484375, -2.376556396484375, -2.249267578125, -2.121978759765625, -1.99468994140625, -1.867401123046875, -1.7401123046875, -1.612823486328125, -1.48553466796875, -1.358245849609375, -1.23095703125, -1.103668212890625, -0.97637939453125, -0.849090576171875, -0.7218017578125, -0.594512939453125, -0.46722412109375, -0.339935302734375, -0.212646484375, -0.085357666015625, 0.04193115234375, 0.169219970703125, 0.2965087890625, 0.423797607421875, 0.55108642578125, 0.678375244140625, 0.8056640625, 0.932952880859375, 1.06024169921875, 1.187530517578125, 1.3148193359375, 1.442108154296875, 1.56939697265625, 1.696685791015625, 1.823974609375, 1.951263427734375, 2.07855224609375, 2.205841064453125, 2.3331298828125, 2.460418701171875, 2.58770751953125, 2.714996337890625, 2.84228515625, 2.969573974609375, 3.09686279296875, 3.224151611328125, 3.3514404296875, 3.478729248046875, 3.60601806640625, 3.733306884765625, 3.860595703125, 3.987884521484375, 4.11517333984375, 4.242462158203125, 4.3697509765625, 4.497039794921875, 4.62432861328125, 4.751617431640625, 4.87890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 9.0, 7.0, 6.0, 13.0, 12.0, 24.0, 13.0, 15.0, 27.0, 29.0, 28.0, 39.0, 40.0, 52.0, 52.0, 46.0, 66.0, 39.0, 64.0, 45.0, 49.0, 38.0, 41.0, 35.0, 39.0, 31.0, 37.0, 21.0, 19.0, 13.0, 11.0, 9.0, 6.0, 7.0, 6.0, 4.0, 10.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12890625, -4.94940185546875, -4.7698974609375, -4.59039306640625, -4.410888671875, -4.23138427734375, -4.0518798828125, -3.87237548828125, -3.69287109375, -3.51336669921875, -3.3338623046875, -3.15435791015625, -2.974853515625, -2.79534912109375, -2.6158447265625, -2.43634033203125, -2.2568359375, -2.07733154296875, -1.8978271484375, -1.71832275390625, -1.538818359375, -1.35931396484375, -1.1798095703125, -1.00030517578125, -0.82080078125, -0.64129638671875, -0.4617919921875, -0.28228759765625, -0.102783203125, 0.07672119140625, 0.2562255859375, 0.43572998046875, 0.615234375, 0.79473876953125, 0.9742431640625, 1.15374755859375, 1.333251953125, 1.51275634765625, 1.6922607421875, 1.87176513671875, 2.05126953125, 2.23077392578125, 2.4102783203125, 2.58978271484375, 2.769287109375, 2.94879150390625, 3.1282958984375, 3.30780029296875, 3.4873046875, 3.66680908203125, 3.8463134765625, 4.02581787109375, 4.205322265625, 4.38482666015625, 4.5643310546875, 4.74383544921875, 4.92333984375, 5.10284423828125, 5.2823486328125, 5.46185302734375, 5.641357421875, 5.82086181640625, 6.0003662109375, 6.17987060546875, 6.359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 5.0, 6.0, 8.0, 10.0, 11.0, 17.0, 26.0, 24.0, 41.0, 54.0, 74.0, 106.0, 150.0, 271.0, 530.0, 1887.0, 9229.0, 126679.0, 863685.0, 38547.0, 4792.0, 1188.0, 454.0, 214.0, 131.0, 94.0, 62.0, 61.0, 41.0, 33.0, 19.0, 23.0, 15.0, 14.0, 10.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.0234375, -8.7525634765625, -8.481689453125, -8.2108154296875, -7.93994140625, -7.6690673828125, -7.398193359375, -7.1273193359375, -6.8564453125, -6.5855712890625, -6.314697265625, -6.0438232421875, -5.77294921875, -5.5020751953125, -5.231201171875, -4.9603271484375, -4.689453125, -4.4185791015625, -4.147705078125, -3.8768310546875, -3.60595703125, -3.3350830078125, -3.064208984375, -2.7933349609375, -2.5224609375, -2.2515869140625, -1.980712890625, -1.7098388671875, -1.43896484375, -1.1680908203125, -0.897216796875, -0.6263427734375, -0.35546875, -0.0845947265625, 0.186279296875, 0.4571533203125, 0.72802734375, 0.9989013671875, 1.269775390625, 1.5406494140625, 1.8115234375, 2.0823974609375, 2.353271484375, 2.6241455078125, 2.89501953125, 3.1658935546875, 3.436767578125, 3.7076416015625, 3.978515625, 4.2493896484375, 4.520263671875, 4.7911376953125, 5.06201171875, 5.3328857421875, 5.603759765625, 5.8746337890625, 6.1455078125, 6.4163818359375, 6.687255859375, 6.9581298828125, 7.22900390625, 7.4998779296875, 7.770751953125, 8.0416259765625, 8.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 2.0, 11.0, 12.0, 16.0, 17.0, 18.0, 16.0, 27.0, 24.0, 26.0, 38.0, 39.0, 42.0, 43.0, 53.0, 44.0, 52.0, 59.0, 58.0, 49.0, 45.0, 38.0, 31.0, 36.0, 28.0, 24.0, 29.0, 21.0, 15.0, 19.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.77734375, -7.5662841796875, -7.355224609375, -7.1441650390625, -6.93310546875, -6.7220458984375, -6.510986328125, -6.2999267578125, -6.0888671875, -5.8778076171875, -5.666748046875, -5.4556884765625, -5.24462890625, -5.0335693359375, -4.822509765625, -4.6114501953125, -4.400390625, -4.1893310546875, -3.978271484375, -3.7672119140625, -3.55615234375, -3.3450927734375, -3.134033203125, -2.9229736328125, -2.7119140625, -2.5008544921875, -2.289794921875, -2.0787353515625, -1.86767578125, -1.6566162109375, -1.445556640625, -1.2344970703125, -1.0234375, -0.8123779296875, -0.601318359375, -0.3902587890625, -0.17919921875, 0.0318603515625, 0.242919921875, 0.4539794921875, 0.6650390625, 0.8760986328125, 1.087158203125, 1.2982177734375, 1.50927734375, 1.7203369140625, 1.931396484375, 2.1424560546875, 2.353515625, 2.5645751953125, 2.775634765625, 2.9866943359375, 3.19775390625, 3.4088134765625, 3.619873046875, 3.8309326171875, 4.0419921875, 4.2530517578125, 4.464111328125, 4.6751708984375, 4.88623046875, 5.0972900390625, 5.308349609375, 5.5194091796875, 5.73046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 4.0, 4.0, 7.0, 9.0, 9.0, 23.0, 30.0, 73.0, 157.0, 345.0, 1085.0, 4884.0, 43713.0, 837706.0, 146643.0, 11032.0, 1905.0, 483.0, 177.0, 109.0, 49.0, 26.0, 22.0, 17.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.09375, -2.0277099609375, -1.961669921875, -1.8956298828125, -1.82958984375, -1.7635498046875, -1.697509765625, -1.6314697265625, -1.5654296875, -1.4993896484375, -1.433349609375, -1.3673095703125, -1.30126953125, -1.2352294921875, -1.169189453125, -1.1031494140625, -1.037109375, -0.9710693359375, -0.905029296875, -0.8389892578125, -0.77294921875, -0.7069091796875, -0.640869140625, -0.5748291015625, -0.5087890625, -0.4427490234375, -0.376708984375, -0.3106689453125, -0.24462890625, -0.1785888671875, -0.112548828125, -0.0465087890625, 0.01953125, 0.0855712890625, 0.151611328125, 0.2176513671875, 0.28369140625, 0.3497314453125, 0.415771484375, 0.4818115234375, 0.5478515625, 0.6138916015625, 0.679931640625, 0.7459716796875, 0.81201171875, 0.8780517578125, 0.944091796875, 1.0101318359375, 1.076171875, 1.1422119140625, 1.208251953125, 1.2742919921875, 1.34033203125, 1.4063720703125, 1.472412109375, 1.5384521484375, 1.6044921875, 1.6705322265625, 1.736572265625, 1.8026123046875, 1.86865234375, 1.9346923828125, 2.000732421875, 2.0667724609375, 2.1328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 10.0, 13.0, 7.0, 14.0, 18.0, 25.0, 48.0, 71.0, 90.0, 118.0, 154.0, 107.0, 82.0, 56.0, 51.0, 35.0, 25.0, 13.0, 7.0, 9.0, 3.0, 7.0, 4.0, 3.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021648406982421875, -0.000210542231798172, -0.00020460039377212524, -0.0001986585557460785, -0.00019271671772003174, -0.00018677487969398499, -0.00018083304166793823, -0.00017489120364189148, -0.00016894936561584473, -0.00016300752758979797, -0.00015706568956375122, -0.00015112385153770447, -0.00014518201351165771, -0.00013924017548561096, -0.0001332983374595642, -0.00012735649943351746, -0.0001214146614074707, -0.00011547282338142395, -0.0001095309853553772, -0.00010358914732933044, -9.764730930328369e-05, -9.170547127723694e-05, -8.576363325119019e-05, -7.982179522514343e-05, -7.387995719909668e-05, -6.793811917304993e-05, -6.199628114700317e-05, -5.605444312095642e-05, -5.011260509490967e-05, -4.4170767068862915e-05, -3.822892904281616e-05, -3.228709101676941e-05, -2.6345252990722656e-05, -2.0403414964675903e-05, -1.446157693862915e-05, -8.519738912582397e-06, -2.5779008865356445e-06, 3.3639371395111084e-06, 9.305775165557861e-06, 1.5247613191604614e-05, 2.1189451217651367e-05, 2.713128924369812e-05, 3.307312726974487e-05, 3.9014965295791626e-05, 4.495680332183838e-05, 5.089864134788513e-05, 5.6840479373931885e-05, 6.278231739997864e-05, 6.872415542602539e-05, 7.466599345207214e-05, 8.06078314781189e-05, 8.654966950416565e-05, 9.24915075302124e-05, 9.843334555625916e-05, 0.00010437518358230591, 0.00011031702160835266, 0.00011625885963439941, 0.00012220069766044617, 0.00012814253568649292, 0.00013408437371253967, 0.00014002621173858643, 0.00014596804976463318, 0.00015190988779067993, 0.00015785172581672668, 0.00016379356384277344]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 12.0, 11.0, 22.0, 40.0, 64.0, 130.0, 276.0, 602.0, 1564.0, 5575.0, 37345.0, 701559.0, 275838.0, 19770.0, 3685.0, 1136.0, 487.0, 206.0, 90.0, 44.0, 26.0, 20.0, 12.0, 4.0, 7.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3279266357421875, -1.264251708984375, -1.2005767822265625, -1.13690185546875, -1.0732269287109375, -1.009552001953125, -0.9458770751953125, -0.8822021484375, -0.8185272216796875, -0.754852294921875, -0.6911773681640625, -0.62750244140625, -0.5638275146484375, -0.500152587890625, -0.4364776611328125, -0.372802734375, -0.3091278076171875, -0.245452880859375, -0.1817779541015625, -0.11810302734375, -0.0544281005859375, 0.009246826171875, 0.0729217529296875, 0.1365966796875, 0.2002716064453125, 0.263946533203125, 0.3276214599609375, 0.39129638671875, 0.4549713134765625, 0.518646240234375, 0.5823211669921875, 0.64599609375, 0.7096710205078125, 0.773345947265625, 0.8370208740234375, 0.90069580078125, 0.9643707275390625, 1.028045654296875, 1.0917205810546875, 1.1553955078125, 1.2190704345703125, 1.282745361328125, 1.3464202880859375, 1.41009521484375, 1.4737701416015625, 1.537445068359375, 1.6011199951171875, 1.664794921875, 1.7284698486328125, 1.792144775390625, 1.8558197021484375, 1.91949462890625, 1.9831695556640625, 2.046844482421875, 2.1105194091796875, 2.1741943359375, 2.2378692626953125, 2.301544189453125, 2.3652191162109375, 2.42889404296875, 2.4925689697265625, 2.556243896484375, 2.6199188232421875, 2.68359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 2.0, 14.0, 12.0, 13.0, 14.0, 32.0, 36.0, 48.0, 64.0, 98.0, 160.0, 145.0, 83.0, 78.0, 61.0, 43.0, 13.0, 14.0, 17.0, 11.0, 5.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74609375, -0.725372314453125, -0.70465087890625, -0.683929443359375, -0.6632080078125, -0.642486572265625, -0.62176513671875, -0.601043701171875, -0.580322265625, -0.559600830078125, -0.53887939453125, -0.518157958984375, -0.4974365234375, -0.476715087890625, -0.45599365234375, -0.435272216796875, -0.41455078125, -0.393829345703125, -0.37310791015625, -0.352386474609375, -0.3316650390625, -0.310943603515625, -0.29022216796875, -0.269500732421875, -0.248779296875, -0.228057861328125, -0.20733642578125, -0.186614990234375, -0.1658935546875, -0.145172119140625, -0.12445068359375, -0.103729248046875, -0.0830078125, -0.062286376953125, -0.04156494140625, -0.020843505859375, -0.0001220703125, 0.020599365234375, 0.04132080078125, 0.062042236328125, 0.082763671875, 0.103485107421875, 0.12420654296875, 0.144927978515625, 0.1656494140625, 0.186370849609375, 0.20709228515625, 0.227813720703125, 0.24853515625, 0.269256591796875, 0.28997802734375, 0.310699462890625, 0.3314208984375, 0.352142333984375, 0.37286376953125, 0.393585205078125, 0.414306640625, 0.435028076171875, 0.45574951171875, 0.476470947265625, 0.4971923828125, 0.517913818359375, 0.53863525390625, 0.559356689453125, 0.580078125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 28.0, 35.0, 112.0, 162.0, 196.0, 177.0, 132.0, 77.0, 40.0, 17.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.770491600036621, -11.17680835723877, -10.583126068115234, -9.989442825317383, -9.395759582519531, -8.80207633972168, -8.208393096923828, -7.614710807800293, -7.021027565002441, -6.42734432220459, -5.8336615562438965, -5.239978790283203, -4.646295547485352, -4.0526123046875, -3.4589295387268066, -2.8652467727661133, -2.2715635299682617, -1.6778805255889893, -1.0841975212097168, -0.49051451683044434, 0.10316848754882812, 0.6968514919281006, 1.290534496307373, 1.8842172622680664, 2.477900505065918, 3.0715835094451904, 3.665266513824463, 4.258949279785156, 4.852632522583008, 5.446315765380859, 6.039998531341553, 6.633681297302246, 7.227365493774414, 7.821048736572266, 8.414731979370117, 9.008414268493652, 9.602097511291504, 10.195780754089355, 10.78946304321289, 11.383146286010742, 11.976829528808594, 12.570512771606445, 13.164196014404297, 13.757878303527832, 14.351561546325684, 14.945244789123535, 15.53892707824707, 16.132610321044922, 16.726293563842773, 17.319976806640625, 17.913660049438477, 18.507343292236328, 19.101024627685547, 19.6947078704834, 20.28839111328125, 20.8820743560791, 21.475757598876953, 22.069440841674805, 22.663124084472656, 23.256807327270508, 23.85049057006836, 24.444171905517578, 25.03785514831543, 25.63153839111328, 26.225221633911133]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 10.0, 6.0, 7.0, 9.0, 13.0, 18.0, 12.0, 15.0, 20.0, 23.0, 26.0, 26.0, 25.0, 24.0, 26.0, 33.0, 35.0, 28.0, 37.0, 36.0, 40.0, 37.0, 44.0, 42.0, 37.0, 29.0, 45.0, 27.0, 37.0, 36.0, 33.0, 16.0, 24.0, 17.0, 19.0, 16.0, 11.0, 7.0, 12.0, 12.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.163599967956543, -8.86579704284668, -8.567995071411133, -8.27019214630127, -7.972389221191406, -7.674586772918701, -7.376784324645996, -7.078981399536133, -6.781178951263428, -6.483376502990723, -6.185573577880859, -5.887771129608154, -5.589968681335449, -5.292165756225586, -4.994363307952881, -4.696560859680176, -4.3987579345703125, -4.100955486297607, -3.803152561187744, -3.505350112915039, -3.207547426223755, -2.9097447395324707, -2.6119422912597656, -2.3141396045684814, -2.0163369178771973, -1.718534231185913, -1.4207316637039185, -1.1229290962219238, -0.8251264095306396, -0.5273237228393555, -0.22952115535736084, 0.06828141212463379, 0.36608409881591797, 0.6638867259025574, 0.9616893529891968, 1.2594919204711914, 1.5572946071624756, 1.8550972938537598, 2.152899742126465, 2.450702428817749, 2.748505115509033, 3.0463078022003174, 3.3441104888916016, 3.6419129371643066, 3.939715623855591, 4.237518310546875, 4.53532075881958, 4.833123207092285, 5.130926132202148, 5.4287285804748535, 5.726531505584717, 6.024333953857422, 6.322136878967285, 6.61993932723999, 6.917741775512695, 7.215544700622559, 7.513347148895264, 7.811149597167969, 8.108952522277832, 8.406755447387695, 8.704557418823242, 9.002360343933105, 9.300163269042969, 9.597965240478516, 9.895768165588379]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 3.0, 10.0, 11.0, 9.0, 18.0, 26.0, 45.0, 49.0, 59.0, 78.0, 103.0, 150.0, 187.0, 283.0, 463.0, 815.0, 1643.0, 4532.0, 17460.0, 160075.0, 3535865.0, 434870.0, 26862.0, 5877.0, 2200.0, 933.0, 496.0, 334.0, 217.0, 150.0, 113.0, 82.0, 62.0, 58.0, 33.0, 41.0, 18.0, 17.0, 12.0, 11.0, 3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.4129638671875, -7.154052734375, -6.8951416015625, -6.63623046875, -6.3773193359375, -6.118408203125, -5.8594970703125, -5.6005859375, -5.3416748046875, -5.082763671875, -4.8238525390625, -4.56494140625, -4.3060302734375, -4.047119140625, -3.7882080078125, -3.529296875, -3.2703857421875, -3.011474609375, -2.7525634765625, -2.49365234375, -2.2347412109375, -1.975830078125, -1.7169189453125, -1.4580078125, -1.1990966796875, -0.940185546875, -0.6812744140625, -0.42236328125, -0.1634521484375, 0.095458984375, 0.3543701171875, 0.61328125, 0.8721923828125, 1.131103515625, 1.3900146484375, 1.64892578125, 1.9078369140625, 2.166748046875, 2.4256591796875, 2.6845703125, 2.9434814453125, 3.202392578125, 3.4613037109375, 3.72021484375, 3.9791259765625, 4.238037109375, 4.4969482421875, 4.755859375, 5.0147705078125, 5.273681640625, 5.5325927734375, 5.79150390625, 6.0504150390625, 6.309326171875, 6.5682373046875, 6.8271484375, 7.0860595703125, 7.344970703125, 7.6038818359375, 7.86279296875, 8.1217041015625, 8.380615234375, 8.6395263671875, 8.8984375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 13.0, 12.0, 13.0, 15.0, 24.0, 29.0, 29.0, 47.0, 49.0, 49.0, 63.0, 59.0, 80.0, 66.0, 69.0, 60.0, 59.0, 48.0, 39.0, 41.0, 30.0, 26.0, 26.0, 18.0, 12.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.30987548828125, -3.1783447265625, -3.04681396484375, -2.915283203125, -2.78375244140625, -2.6522216796875, -2.52069091796875, -2.38916015625, -2.25762939453125, -2.1260986328125, -1.99456787109375, -1.863037109375, -1.73150634765625, -1.5999755859375, -1.46844482421875, -1.3369140625, -1.20538330078125, -1.0738525390625, -0.94232177734375, -0.810791015625, -0.67926025390625, -0.5477294921875, -0.41619873046875, -0.28466796875, -0.15313720703125, -0.0216064453125, 0.10992431640625, 0.241455078125, 0.37298583984375, 0.5045166015625, 0.63604736328125, 0.767578125, 0.89910888671875, 1.0306396484375, 1.16217041015625, 1.293701171875, 1.42523193359375, 1.5567626953125, 1.68829345703125, 1.81982421875, 1.95135498046875, 2.0828857421875, 2.21441650390625, 2.345947265625, 2.47747802734375, 2.6090087890625, 2.74053955078125, 2.8720703125, 3.00360107421875, 3.1351318359375, 3.26666259765625, 3.398193359375, 3.52972412109375, 3.6612548828125, 3.79278564453125, 3.92431640625, 4.05584716796875, 4.1873779296875, 4.31890869140625, 4.450439453125, 4.58197021484375, 4.7135009765625, 4.84503173828125, 4.9765625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 17.0, 47.0, 46.0, 96.0, 243.0, 841.0, 5869.0, 415903.0, 3753847.0, 15232.0, 1417.0, 362.0, 129.0, 71.0, 35.0, 24.0, 19.0, 12.0, 12.0, 7.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.685302734375, -9.15185546875, -8.618408203125, -8.0849609375, -7.551513671875, -7.01806640625, -6.484619140625, -5.951171875, -5.417724609375, -4.88427734375, -4.350830078125, -3.8173828125, -3.283935546875, -2.75048828125, -2.217041015625, -1.68359375, -1.150146484375, -0.61669921875, -0.083251953125, 0.4501953125, 0.983642578125, 1.51708984375, 2.050537109375, 2.583984375, 3.117431640625, 3.65087890625, 4.184326171875, 4.7177734375, 5.251220703125, 5.78466796875, 6.318115234375, 6.8515625, 7.385009765625, 7.91845703125, 8.451904296875, 8.9853515625, 9.518798828125, 10.05224609375, 10.585693359375, 11.119140625, 11.652587890625, 12.18603515625, 12.719482421875, 13.2529296875, 13.786376953125, 14.31982421875, 14.853271484375, 15.38671875, 15.920166015625, 16.45361328125, 16.987060546875, 17.5205078125, 18.053955078125, 18.58740234375, 19.120849609375, 19.654296875, 20.187744140625, 20.72119140625, 21.254638671875, 21.7880859375, 22.321533203125, 22.85498046875, 23.388427734375, 23.921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 2.0, 9.0, 11.0, 11.0, 12.0, 15.0, 30.0, 50.0, 52.0, 85.0, 123.0, 165.0, 310.0, 474.0, 595.0, 687.0, 514.0, 313.0, 190.0, 120.0, 93.0, 54.0, 24.0, 32.0, 25.0, 16.0, 10.0, 14.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0], "bins": [-1.9453125, -1.8941650390625, -1.843017578125, -1.7918701171875, -1.74072265625, -1.6895751953125, -1.638427734375, -1.5872802734375, -1.5361328125, -1.4849853515625, -1.433837890625, -1.3826904296875, -1.33154296875, -1.2803955078125, -1.229248046875, -1.1781005859375, -1.126953125, -1.0758056640625, -1.024658203125, -0.9735107421875, -0.92236328125, -0.8712158203125, -0.820068359375, -0.7689208984375, -0.7177734375, -0.6666259765625, -0.615478515625, -0.5643310546875, -0.51318359375, -0.4620361328125, -0.410888671875, -0.3597412109375, -0.30859375, -0.2574462890625, -0.206298828125, -0.1551513671875, -0.10400390625, -0.0528564453125, -0.001708984375, 0.0494384765625, 0.1005859375, 0.1517333984375, 0.202880859375, 0.2540283203125, 0.30517578125, 0.3563232421875, 0.407470703125, 0.4586181640625, 0.509765625, 0.5609130859375, 0.612060546875, 0.6632080078125, 0.71435546875, 0.7655029296875, 0.816650390625, 0.8677978515625, 0.9189453125, 0.9700927734375, 1.021240234375, 1.0723876953125, 1.12353515625, 1.1746826171875, 1.225830078125, 1.2769775390625, 1.328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 2.0, 10.0, 16.0, 22.0, 25.0, 41.0, 71.0, 100.0, 131.0, 143.0, 115.0, 137.0, 80.0, 37.0, 30.0, 25.0, 15.0, 11.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.551288604736328, -3.272958993911743, -2.994629383087158, -2.716299533843994, -2.437969923019409, -2.159640312194824, -1.8813105821609497, -1.6029808521270752, -1.3246512413024902, -1.0463216304779053, -0.7679919004440308, -0.489662230014801, -0.2113325595855713, 0.06699705123901367, 0.3453267812728882, 0.6236565113067627, 0.9019861221313477, 1.1803157329559326, 1.4586454629898071, 1.7369751930236816, 2.0153048038482666, 2.2936344146728516, 2.5719642639160156, 2.8502938747406006, 3.1286234855651855, 3.4069530963897705, 3.6852827072143555, 3.9636125564575195, 4.241942405700684, 4.5202717781066895, 4.7986016273498535, 5.076930999755859, 5.355259895324707, 5.633589744567871, 5.911919116973877, 6.190248966217041, 6.468578338623047, 6.746908187866211, 7.025238037109375, 7.303567886352539, 7.581897258758545, 7.860227108001709, 8.138556480407715, 8.416886329650879, 8.695216178894043, 8.97354507446289, 9.251874923706055, 9.530204772949219, 9.808534622192383, 10.086864471435547, 10.365194320678711, 10.643523216247559, 10.921853065490723, 11.200182914733887, 11.47851276397705, 11.756842613220215, 12.035171508789062, 12.313501358032227, 12.59183120727539, 12.870160102844238, 13.148489952087402, 13.426819801330566, 13.70514965057373, 13.983479499816895, 14.261809349060059]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 10.0, 12.0, 14.0, 13.0, 18.0, 18.0, 22.0, 27.0, 24.0, 32.0, 42.0, 33.0, 39.0, 31.0, 49.0, 40.0, 39.0, 47.0, 46.0, 48.0, 49.0, 34.0, 35.0, 26.0, 33.0, 24.0, 24.0, 31.0, 28.0, 19.0, 27.0, 12.0, 11.0, 8.0, 4.0, 4.0, 7.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3730459213256836, -3.2639875411987305, -3.1549289226531982, -3.045870542526245, -2.936811923980713, -2.8277535438537598, -2.7186951637268066, -2.6096365451812744, -2.500577926635742, -2.391519546508789, -2.282460927963257, -2.1734025478363037, -2.0643439292907715, -1.9552855491638184, -1.8462270498275757, -1.737168550491333, -1.6281101703643799, -1.5190516710281372, -1.4099931716918945, -1.3009347915649414, -1.1918761730194092, -1.082817792892456, -0.9737592935562134, -0.8647007942199707, -0.755642294883728, -0.6465837955474854, -0.5375252962112427, -0.4284668564796448, -0.3194083571434021, -0.21034985780715942, -0.10129141807556152, 0.007767081260681152, 0.11682581901550293, 0.2258843034505844, 0.3349427878856659, 0.4440012574195862, 0.5530597567558289, 0.6621182560920715, 0.7711766958236694, 0.8802351951599121, 0.9892936944961548, 1.0983521938323975, 1.2074106931686401, 1.3164691925048828, 1.425527572631836, 1.5345861911773682, 1.6436445713043213, 1.752703070640564, 1.8617615699768066, 1.9708200693130493, 2.079878568649292, 2.188936948776245, 2.2979955673217773, 2.4070539474487305, 2.5161123275756836, 2.625170946121216, 2.734229564666748, 2.843287944793701, 2.9523465633392334, 3.0614049434661865, 3.1704635620117188, 3.279521942138672, 3.388580322265625, 3.4976389408111572, 3.6066973209381104]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 9.0, 19.0, 22.0, 38.0, 63.0, 97.0, 135.0, 274.0, 477.0, 875.0, 1606.0, 3406.0, 7035.0, 15521.0, 38356.0, 109111.0, 332785.0, 348906.0, 117532.0, 40749.0, 16876.0, 7297.0, 3575.0, 1685.0, 908.0, 503.0, 276.0, 151.0, 85.0, 55.0, 46.0, 20.0, 14.0, 15.0, 10.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3101348876953125, -1.271636962890625, -1.2331390380859375, -1.19464111328125, -1.1561431884765625, -1.117645263671875, -1.0791473388671875, -1.0406494140625, -1.0021514892578125, -0.963653564453125, -0.9251556396484375, -0.88665771484375, -0.8481597900390625, -0.809661865234375, -0.7711639404296875, -0.732666015625, -0.6941680908203125, -0.655670166015625, -0.6171722412109375, -0.57867431640625, -0.5401763916015625, -0.501678466796875, -0.4631805419921875, -0.4246826171875, -0.3861846923828125, -0.347686767578125, -0.3091888427734375, -0.27069091796875, -0.2321929931640625, -0.193695068359375, -0.1551971435546875, -0.11669921875, -0.0782012939453125, -0.039703369140625, -0.0012054443359375, 0.03729248046875, 0.0757904052734375, 0.114288330078125, 0.1527862548828125, 0.1912841796875, 0.2297821044921875, 0.268280029296875, 0.3067779541015625, 0.34527587890625, 0.3837738037109375, 0.422271728515625, 0.4607696533203125, 0.499267578125, 0.5377655029296875, 0.576263427734375, 0.6147613525390625, 0.65325927734375, 0.6917572021484375, 0.730255126953125, 0.7687530517578125, 0.8072509765625, 0.8457489013671875, 0.884246826171875, 0.9227447509765625, 0.96124267578125, 0.9997406005859375, 1.038238525390625, 1.0767364501953125, 1.115234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 4.0, 7.0, 12.0, 7.0, 12.0, 18.0, 20.0, 25.0, 23.0, 22.0, 36.0, 43.0, 28.0, 47.0, 53.0, 47.0, 40.0, 57.0, 39.0, 43.0, 61.0, 47.0, 43.0, 31.0, 38.0, 24.0, 25.0, 31.0, 21.0, 21.0, 15.0, 17.0, 8.0, 8.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -2.00445556640625, -1.9346923828125, -1.86492919921875, -1.795166015625, -1.72540283203125, -1.6556396484375, -1.58587646484375, -1.51611328125, -1.44635009765625, -1.3765869140625, -1.30682373046875, -1.237060546875, -1.16729736328125, -1.0975341796875, -1.02777099609375, -0.9580078125, -0.88824462890625, -0.8184814453125, -0.74871826171875, -0.678955078125, -0.60919189453125, -0.5394287109375, -0.46966552734375, -0.39990234375, -0.33013916015625, -0.2603759765625, -0.19061279296875, -0.120849609375, -0.05108642578125, 0.0186767578125, 0.08843994140625, 0.158203125, 0.22796630859375, 0.2977294921875, 0.36749267578125, 0.437255859375, 0.50701904296875, 0.5767822265625, 0.64654541015625, 0.71630859375, 0.78607177734375, 0.8558349609375, 0.92559814453125, 0.995361328125, 1.06512451171875, 1.1348876953125, 1.20465087890625, 1.2744140625, 1.34417724609375, 1.4139404296875, 1.48370361328125, 1.553466796875, 1.62322998046875, 1.6929931640625, 1.76275634765625, 1.83251953125, 1.90228271484375, 1.9720458984375, 2.04180908203125, 2.111572265625, 2.18133544921875, 2.2510986328125, 2.32086181640625, 2.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 11.0, 4.0, 2.0, 4.0, 8.0, 7.0, 15.0, 16.0, 19.0, 24.0, 40.0, 49.0, 76.0, 90.0, 176.0, 279.0, 509.0, 1095.0, 2495.0, 6740.0, 21466.0, 87487.0, 448872.0, 378949.0, 71471.0, 18235.0, 5877.0, 2272.0, 1054.0, 476.0, 245.0, 181.0, 88.0, 75.0, 36.0, 30.0, 19.0, 19.0, 15.0, 6.0, 10.0, 10.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.4989776611328125, -1.447174072265625, -1.3953704833984375, -1.34356689453125, -1.2917633056640625, -1.239959716796875, -1.1881561279296875, -1.1363525390625, -1.0845489501953125, -1.032745361328125, -0.9809417724609375, -0.92913818359375, -0.8773345947265625, -0.825531005859375, -0.7737274169921875, -0.721923828125, -0.6701202392578125, -0.618316650390625, -0.5665130615234375, -0.51470947265625, -0.4629058837890625, -0.411102294921875, -0.3592987060546875, -0.3074951171875, -0.2556915283203125, -0.203887939453125, -0.1520843505859375, -0.10028076171875, -0.0484771728515625, 0.003326416015625, 0.0551300048828125, 0.10693359375, 0.1587371826171875, 0.210540771484375, 0.2623443603515625, 0.31414794921875, 0.3659515380859375, 0.417755126953125, 0.4695587158203125, 0.5213623046875, 0.5731658935546875, 0.624969482421875, 0.6767730712890625, 0.72857666015625, 0.7803802490234375, 0.832183837890625, 0.8839874267578125, 0.935791015625, 0.9875946044921875, 1.039398193359375, 1.0912017822265625, 1.14300537109375, 1.1948089599609375, 1.246612548828125, 1.2984161376953125, 1.3502197265625, 1.4020233154296875, 1.453826904296875, 1.5056304931640625, 1.55743408203125, 1.6092376708984375, 1.661041259765625, 1.7128448486328125, 1.7646484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 17.0, 13.0, 14.0, 14.0, 23.0, 24.0, 33.0, 37.0, 31.0, 46.0, 43.0, 53.0, 58.0, 43.0, 65.0, 72.0, 42.0, 50.0, 52.0, 32.0, 45.0, 33.0, 27.0, 25.0, 20.0, 14.0, 13.0, 13.0, 10.0, 5.0, 10.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.7623291015625, -5.591064453125, -5.4197998046875, -5.24853515625, -5.0772705078125, -4.906005859375, -4.7347412109375, -4.5634765625, -4.3922119140625, -4.220947265625, -4.0496826171875, -3.87841796875, -3.7071533203125, -3.535888671875, -3.3646240234375, -3.193359375, -3.0220947265625, -2.850830078125, -2.6795654296875, -2.50830078125, -2.3370361328125, -2.165771484375, -1.9945068359375, -1.8232421875, -1.6519775390625, -1.480712890625, -1.3094482421875, -1.13818359375, -0.9669189453125, -0.795654296875, -0.6243896484375, -0.453125, -0.2818603515625, -0.110595703125, 0.0606689453125, 0.23193359375, 0.4031982421875, 0.574462890625, 0.7457275390625, 0.9169921875, 1.0882568359375, 1.259521484375, 1.4307861328125, 1.60205078125, 1.7733154296875, 1.944580078125, 2.1158447265625, 2.287109375, 2.4583740234375, 2.629638671875, 2.8009033203125, 2.97216796875, 3.1434326171875, 3.314697265625, 3.4859619140625, 3.6572265625, 3.8284912109375, 3.999755859375, 4.1710205078125, 4.34228515625, 4.5135498046875, 4.684814453125, 4.8560791015625, 5.02734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 12.0, 7.0, 15.0, 26.0, 23.0, 56.0, 74.0, 94.0, 143.0, 223.0, 323.0, 498.0, 753.0, 1095.0, 1961.0, 3421.0, 6376.0, 16320.0, 70189.0, 558619.0, 322596.0, 41539.0, 11889.0, 5025.0, 2814.0, 1561.0, 934.0, 636.0, 408.0, 319.0, 192.0, 111.0, 86.0, 54.0, 39.0, 25.0, 24.0, 19.0, 15.0, 4.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.001953125, -0.9714508056640625, -0.940948486328125, -0.9104461669921875, -0.87994384765625, -0.8494415283203125, -0.818939208984375, -0.7884368896484375, -0.7579345703125, -0.7274322509765625, -0.696929931640625, -0.6664276123046875, -0.63592529296875, -0.6054229736328125, -0.574920654296875, -0.5444183349609375, -0.513916015625, -0.4834136962890625, -0.452911376953125, -0.4224090576171875, -0.39190673828125, -0.3614044189453125, -0.330902099609375, -0.3003997802734375, -0.2698974609375, -0.2393951416015625, -0.208892822265625, -0.1783905029296875, -0.14788818359375, -0.1173858642578125, -0.086883544921875, -0.0563812255859375, -0.02587890625, 0.0046234130859375, 0.035125732421875, 0.0656280517578125, 0.09613037109375, 0.1266326904296875, 0.157135009765625, 0.1876373291015625, 0.2181396484375, 0.2486419677734375, 0.279144287109375, 0.3096466064453125, 0.34014892578125, 0.3706512451171875, 0.401153564453125, 0.4316558837890625, 0.462158203125, 0.4926605224609375, 0.523162841796875, 0.5536651611328125, 0.58416748046875, 0.6146697998046875, 0.645172119140625, 0.6756744384765625, 0.7061767578125, 0.7366790771484375, 0.767181396484375, 0.7976837158203125, 0.82818603515625, 0.8586883544921875, 0.889190673828125, 0.9196929931640625, 0.9501953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 10.0, 19.0, 17.0, 28.0, 37.0, 51.0, 90.0, 97.0, 132.0, 138.0, 100.0, 71.0, 43.0, 41.0, 28.0, 22.0, 10.0, 7.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0004513263702392578, -0.00043908506631851196, -0.0004268437623977661, -0.00041460245847702026, -0.0004023611545562744, -0.00039011985063552856, -0.0003778785467147827, -0.00036563724279403687, -0.000353395938873291, -0.00034115463495254517, -0.0003289133310317993, -0.00031667202711105347, -0.0003044307231903076, -0.00029218941926956177, -0.0002799481153488159, -0.00026770681142807007, -0.0002554655075073242, -0.00024322420358657837, -0.00023098289966583252, -0.00021874159574508667, -0.00020650029182434082, -0.00019425898790359497, -0.00018201768398284912, -0.00016977638006210327, -0.00015753507614135742, -0.00014529377222061157, -0.00013305246829986572, -0.00012081116437911987, -0.00010856986045837402, -9.632855653762817e-05, -8.408725261688232e-05, -7.184594869613647e-05, -5.9604644775390625e-05, -4.7363340854644775e-05, -3.5122036933898926e-05, -2.2880733013153076e-05, -1.0639429092407227e-05, 1.601874828338623e-06, 1.3843178749084473e-05, 2.6084482669830322e-05, 3.832578659057617e-05, 5.056709051132202e-05, 6.280839443206787e-05, 7.504969835281372e-05, 8.729100227355957e-05, 9.953230619430542e-05, 0.00011177361011505127, 0.00012401491403579712, 0.00013625621795654297, 0.00014849752187728882, 0.00016073882579803467, 0.00017298012971878052, 0.00018522143363952637, 0.00019746273756027222, 0.00020970404148101807, 0.00022194534540176392, 0.00023418664932250977, 0.0002464279532432556, 0.00025866925716400146, 0.0002709105610847473, 0.00028315186500549316, 0.000295393168926239, 0.00030763447284698486, 0.0003198757767677307, 0.00033211708068847656]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 8.0, 4.0, 10.0, 6.0, 17.0, 11.0, 25.0, 31.0, 62.0, 98.0, 150.0, 282.0, 398.0, 734.0, 1319.0, 2577.0, 5301.0, 12820.0, 47785.0, 373298.0, 508497.0, 66923.0, 15616.0, 5966.0, 2972.0, 1515.0, 870.0, 506.0, 269.0, 160.0, 100.0, 76.0, 33.0, 30.0, 19.0, 18.0, 10.0, 5.0, 9.0, 9.0, 4.0, 3.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.125, -1.09100341796875, -1.0570068359375, -1.02301025390625, -0.989013671875, -0.95501708984375, -0.9210205078125, -0.88702392578125, -0.85302734375, -0.81903076171875, -0.7850341796875, -0.75103759765625, -0.717041015625, -0.68304443359375, -0.6490478515625, -0.61505126953125, -0.5810546875, -0.54705810546875, -0.5130615234375, -0.47906494140625, -0.445068359375, -0.41107177734375, -0.3770751953125, -0.34307861328125, -0.30908203125, -0.27508544921875, -0.2410888671875, -0.20709228515625, -0.173095703125, -0.13909912109375, -0.1051025390625, -0.07110595703125, -0.037109375, -0.00311279296875, 0.0308837890625, 0.06488037109375, 0.098876953125, 0.13287353515625, 0.1668701171875, 0.20086669921875, 0.23486328125, 0.26885986328125, 0.3028564453125, 0.33685302734375, 0.370849609375, 0.40484619140625, 0.4388427734375, 0.47283935546875, 0.5068359375, 0.54083251953125, 0.5748291015625, 0.60882568359375, 0.642822265625, 0.67681884765625, 0.7108154296875, 0.74481201171875, 0.77880859375, 0.81280517578125, 0.8468017578125, 0.88079833984375, 0.914794921875, 0.94879150390625, 0.9827880859375, 1.01678466796875, 1.05078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 7.0, 6.0, 12.0, 7.0, 18.0, 16.0, 47.0, 74.0, 83.0, 101.0, 124.0, 108.0, 109.0, 77.0, 56.0, 42.0, 18.0, 15.0, 8.0, 6.0, 11.0, 6.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.21961212158203125, -0.2104644775390625, -0.20131683349609375, -0.192169189453125, -0.18302154541015625, -0.1738739013671875, -0.16472625732421875, -0.15557861328125, -0.14643096923828125, -0.1372833251953125, -0.12813568115234375, -0.118988037109375, -0.10984039306640625, -0.1006927490234375, -0.09154510498046875, -0.0823974609375, -0.07324981689453125, -0.0641021728515625, -0.05495452880859375, -0.045806884765625, -0.03665924072265625, -0.0275115966796875, -0.01836395263671875, -0.00921630859375, -6.866455078125e-05, 0.0090789794921875, 0.01822662353515625, 0.027374267578125, 0.03652191162109375, 0.0456695556640625, 0.05481719970703125, 0.06396484375, 0.07311248779296875, 0.0822601318359375, 0.09140777587890625, 0.100555419921875, 0.10970306396484375, 0.1188507080078125, 0.12799835205078125, 0.13714599609375, 0.14629364013671875, 0.1554412841796875, 0.16458892822265625, 0.173736572265625, 0.18288421630859375, 0.1920318603515625, 0.20117950439453125, 0.2103271484375, 0.21947479248046875, 0.2286224365234375, 0.23777008056640625, 0.246917724609375, 0.25606536865234375, 0.2652130126953125, 0.27436065673828125, 0.28350830078125, 0.29265594482421875, 0.3018035888671875, 0.31095123291015625, 0.320098876953125, 0.32924652099609375, 0.3383941650390625, 0.34754180908203125, 0.356689453125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 15.0, 21.0, 21.0, 44.0, 45.0, 60.0, 90.0, 107.0, 125.0, 114.0, 104.0, 86.0, 48.0, 49.0, 23.0, 19.0, 9.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1956605911254883, -2.0638885498046875, -1.9321165084838867, -1.800344467163086, -1.6685724258422852, -1.5368003845214844, -1.4050283432006836, -1.2732563018798828, -1.141484260559082, -1.0097122192382812, -0.8779401779174805, -0.7461681365966797, -0.6143960952758789, -0.4826240539550781, -0.35085201263427734, -0.21907997131347656, -0.08730792999267578, 0.044464111328125, 0.17623615264892578, 0.30800819396972656, 0.43978023529052734, 0.5715522766113281, 0.7033243179321289, 0.8350963592529297, 0.9668684005737305, 1.0986404418945312, 1.230412483215332, 1.3621845245361328, 1.4939565658569336, 1.6257286071777344, 1.7575006484985352, 1.889272689819336, 2.0210442543029785, 2.1528162956237793, 2.28458833694458, 2.416360378265381, 2.5481324195861816, 2.6799044609069824, 2.811676502227783, 2.943448543548584, 3.0752205848693848, 3.2069926261901855, 3.3387646675109863, 3.470536708831787, 3.602308750152588, 3.7340807914733887, 3.8658528327941895, 3.9976248741149902, 4.129396915435791, 4.261168956756592, 4.392940998077393, 4.524713039398193, 4.656485080718994, 4.788257122039795, 4.920029163360596, 5.0518012046813965, 5.183573246002197, 5.315345287322998, 5.447117328643799, 5.5788893699646, 5.7106614112854, 5.842433452606201, 5.974205493927002, 6.105977535247803, 6.2377495765686035]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 10.0, 12.0, 18.0, 18.0, 17.0, 21.0, 23.0, 30.0, 35.0, 27.0, 39.0, 56.0, 55.0, 34.0, 39.0, 39.0, 50.0, 50.0, 54.0, 45.0, 45.0, 26.0, 42.0, 35.0, 31.0, 23.0, 21.0, 24.0, 17.0, 12.0, 6.0, 9.0, 6.0, 3.0, 1.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05198073387146, -1.9827872514724731, -1.9135937690734863, -1.8444002866744995, -1.7752068042755127, -1.7060132026672363, -1.6368197202682495, -1.5676262378692627, -1.4984327554702759, -1.429239273071289, -1.3600457906723022, -1.2908523082733154, -1.221658706665039, -1.1524653434753418, -1.0832717418670654, -1.0140782594680786, -0.9448847770690918, -0.875691294670105, -0.8064978122711182, -0.7373042702674866, -0.6681107878684998, -0.5989173054695129, -0.5297237634658813, -0.46053028106689453, -0.3913367986679077, -0.3221433162689209, -0.2529498040676117, -0.18375630676746368, -0.11456280946731567, -0.04536932706832886, 0.023824185132980347, 0.09301769733428955, 0.16221117973327637, 0.23140467703342438, 0.3005981743335724, 0.3697916865348816, 0.4389851689338684, 0.5081786513328552, 0.5773721933364868, 0.6465656757354736, 0.7157591581344604, 0.7849526405334473, 0.8541461229324341, 0.9233396649360657, 0.9925331473350525, 1.0617265701293945, 1.130920171737671, 1.2001136541366577, 1.2693071365356445, 1.3385006189346313, 1.4076941013336182, 1.476887583732605, 1.5460810661315918, 1.6152746677398682, 1.684468150138855, 1.7536616325378418, 1.8228551149368286, 1.8920485973358154, 1.9612420797348022, 2.030435562133789, 2.0996291637420654, 2.1688225269317627, 2.238016128540039, 2.3072094917297363, 2.3764030933380127]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 16.0, 20.0, 35.0, 53.0, 79.0, 145.0, 274.0, 491.0, 1102.0, 2442.0, 6339.0, 19377.0, 74314.0, 434389.0, 409823.0, 70464.0, 18500.0, 6109.0, 2359.0, 1044.0, 543.0, 263.0, 133.0, 92.0, 45.0, 29.0, 30.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.549346923828125, -4.42291259765625, -4.296478271484375, -4.1700439453125, -4.043609619140625, -3.91717529296875, -3.790740966796875, -3.664306640625, -3.537872314453125, -3.41143798828125, -3.285003662109375, -3.1585693359375, -3.032135009765625, -2.90570068359375, -2.779266357421875, -2.65283203125, -2.526397705078125, -2.39996337890625, -2.273529052734375, -2.1470947265625, -2.020660400390625, -1.89422607421875, -1.767791748046875, -1.641357421875, -1.514923095703125, -1.38848876953125, -1.262054443359375, -1.1356201171875, -1.009185791015625, -0.88275146484375, -0.756317138671875, -0.6298828125, -0.503448486328125, -0.37701416015625, -0.250579833984375, -0.1241455078125, 0.002288818359375, 0.12872314453125, 0.255157470703125, 0.381591796875, 0.508026123046875, 0.63446044921875, 0.760894775390625, 0.8873291015625, 1.013763427734375, 1.14019775390625, 1.266632080078125, 1.39306640625, 1.519500732421875, 1.64593505859375, 1.772369384765625, 1.8988037109375, 2.025238037109375, 2.15167236328125, 2.278106689453125, 2.404541015625, 2.530975341796875, 2.65740966796875, 2.783843994140625, 2.9102783203125, 3.036712646484375, 3.16314697265625, 3.289581298828125, 3.416015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 15.0, 18.0, 23.0, 23.0, 26.0, 33.0, 51.0, 45.0, 33.0, 55.0, 57.0, 55.0, 66.0, 52.0, 48.0, 66.0, 55.0, 56.0, 47.0, 36.0, 28.0, 25.0, 18.0, 14.0, 5.0, 14.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.69134521484375, -4.4998779296875, -4.30841064453125, -4.116943359375, -3.92547607421875, -3.7340087890625, -3.54254150390625, -3.35107421875, -3.15960693359375, -2.9681396484375, -2.77667236328125, -2.585205078125, -2.39373779296875, -2.2022705078125, -2.01080322265625, -1.8193359375, -1.62786865234375, -1.4364013671875, -1.24493408203125, -1.053466796875, -0.86199951171875, -0.6705322265625, -0.47906494140625, -0.28759765625, -0.09613037109375, 0.0953369140625, 0.28680419921875, 0.478271484375, 0.66973876953125, 0.8612060546875, 1.05267333984375, 1.244140625, 1.43560791015625, 1.6270751953125, 1.81854248046875, 2.010009765625, 2.20147705078125, 2.3929443359375, 2.58441162109375, 2.77587890625, 2.96734619140625, 3.1588134765625, 3.35028076171875, 3.541748046875, 3.73321533203125, 3.9246826171875, 4.11614990234375, 4.3076171875, 4.49908447265625, 4.6905517578125, 4.88201904296875, 5.073486328125, 5.26495361328125, 5.4564208984375, 5.64788818359375, 5.83935546875, 6.03082275390625, 6.2222900390625, 6.41375732421875, 6.605224609375, 6.79669189453125, 6.9881591796875, 7.17962646484375, 7.37109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 9.0, 6.0, 13.0, 23.0, 32.0, 67.0, 83.0, 180.0, 462.0, 1594.0, 9489.0, 140000.0, 841695.0, 48383.0, 4894.0, 978.0, 303.0, 143.0, 81.0, 36.0, 24.0, 18.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.53125, -6.2734375, -6.015625, -5.7578125, -5.5, -5.2421875, -4.984375, -4.7265625, -4.46875, -4.2109375, -3.953125, -3.6953125, -3.4375, -3.1796875, -2.921875, -2.6640625, -2.40625, -2.1484375, -1.890625, -1.6328125, -1.375, -1.1171875, -0.859375, -0.6015625, -0.34375, -0.0859375, 0.171875, 0.4296875, 0.6875, 0.9453125, 1.203125, 1.4609375, 1.71875, 1.9765625, 2.234375, 2.4921875, 2.75, 3.0078125, 3.265625, 3.5234375, 3.78125, 4.0390625, 4.296875, 4.5546875, 4.8125, 5.0703125, 5.328125, 5.5859375, 5.84375, 6.1015625, 6.359375, 6.6171875, 6.875, 7.1328125, 7.390625, 7.6484375, 7.90625, 8.1640625, 8.421875, 8.6796875, 8.9375, 9.1953125, 9.453125, 9.7109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 14.0, 9.0, 20.0, 23.0, 21.0, 23.0, 38.0, 33.0, 31.0, 45.0, 39.0, 54.0, 57.0, 66.0, 67.0, 57.0, 55.0, 52.0, 55.0, 38.0, 46.0, 18.0, 17.0, 19.0, 23.0, 18.0, 10.0, 10.0, 12.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.036865234375, -5.81982421875, -5.602783203125, -5.3857421875, -5.168701171875, -4.95166015625, -4.734619140625, -4.517578125, -4.300537109375, -4.08349609375, -3.866455078125, -3.6494140625, -3.432373046875, -3.21533203125, -2.998291015625, -2.78125, -2.564208984375, -2.34716796875, -2.130126953125, -1.9130859375, -1.696044921875, -1.47900390625, -1.261962890625, -1.044921875, -0.827880859375, -0.61083984375, -0.393798828125, -0.1767578125, 0.040283203125, 0.25732421875, 0.474365234375, 0.69140625, 0.908447265625, 1.12548828125, 1.342529296875, 1.5595703125, 1.776611328125, 1.99365234375, 2.210693359375, 2.427734375, 2.644775390625, 2.86181640625, 3.078857421875, 3.2958984375, 3.512939453125, 3.72998046875, 3.947021484375, 4.1640625, 4.381103515625, 4.59814453125, 4.815185546875, 5.0322265625, 5.249267578125, 5.46630859375, 5.683349609375, 5.900390625, 6.117431640625, 6.33447265625, 6.551513671875, 6.7685546875, 6.985595703125, 7.20263671875, 7.419677734375, 7.63671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 8.0, 15.0, 12.0, 30.0, 44.0, 50.0, 138.0, 399.0, 1955.0, 13733.0, 198038.0, 780760.0, 47027.0, 5042.0, 889.0, 206.0, 79.0, 41.0, 19.0, 15.0, 13.0, 7.0, 6.0, 6.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.146484375, -2.085601806640625, -2.02471923828125, -1.963836669921875, -1.9029541015625, -1.842071533203125, -1.78118896484375, -1.720306396484375, -1.659423828125, -1.598541259765625, -1.53765869140625, -1.476776123046875, -1.4158935546875, -1.355010986328125, -1.29412841796875, -1.233245849609375, -1.17236328125, -1.111480712890625, -1.05059814453125, -0.989715576171875, -0.9288330078125, -0.867950439453125, -0.80706787109375, -0.746185302734375, -0.685302734375, -0.624420166015625, -0.56353759765625, -0.502655029296875, -0.4417724609375, -0.380889892578125, -0.32000732421875, -0.259124755859375, -0.1982421875, -0.137359619140625, -0.07647705078125, -0.015594482421875, 0.0452880859375, 0.106170654296875, 0.16705322265625, 0.227935791015625, 0.288818359375, 0.349700927734375, 0.41058349609375, 0.471466064453125, 0.5323486328125, 0.593231201171875, 0.65411376953125, 0.714996337890625, 0.77587890625, 0.836761474609375, 0.89764404296875, 0.958526611328125, 1.0194091796875, 1.080291748046875, 1.14117431640625, 1.202056884765625, 1.262939453125, 1.323822021484375, 1.38470458984375, 1.445587158203125, 1.5064697265625, 1.567352294921875, 1.62823486328125, 1.689117431640625, 1.75]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 12.0, 6.0, 11.0, 26.0, 32.0, 40.0, 74.0, 84.0, 136.0, 191.0, 121.0, 83.0, 44.0, 37.0, 32.0, 11.0, 17.0, 10.0, 7.0, 5.0, 2.0, 3.0, 4.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0002899169921875, -0.00028253719210624695, -0.0002751573920249939, -0.00026777759194374084, -0.0002603977918624878, -0.00025301799178123474, -0.0002456381916999817, -0.00023825839161872864, -0.00023087859153747559, -0.00022349879145622253, -0.00021611899137496948, -0.00020873919129371643, -0.00020135939121246338, -0.00019397959113121033, -0.00018659979104995728, -0.00017921999096870422, -0.00017184019088745117, -0.00016446039080619812, -0.00015708059072494507, -0.00014970079064369202, -0.00014232099056243896, -0.0001349411904811859, -0.00012756139039993286, -0.00012018159031867981, -0.00011280179023742676, -0.0001054219901561737, -9.804219007492065e-05, -9.06623899936676e-05, -8.328258991241455e-05, -7.59027898311615e-05, -6.852298974990845e-05, -6.11431896686554e-05, -5.3763389587402344e-05, -4.638358950614929e-05, -3.900378942489624e-05, -3.162398934364319e-05, -2.4244189262390137e-05, -1.6864389181137085e-05, -9.484589099884033e-06, -2.1047890186309814e-06, 5.27501106262207e-06, 1.2654811143875122e-05, 2.0034611225128174e-05, 2.7414411306381226e-05, 3.479421138763428e-05, 4.217401146888733e-05, 4.955381155014038e-05, 5.693361163139343e-05, 6.431341171264648e-05, 7.169321179389954e-05, 7.907301187515259e-05, 8.645281195640564e-05, 9.383261203765869e-05, 0.00010121241211891174, 0.0001085922122001648, 0.00011597201228141785, 0.0001233518123626709, 0.00013073161244392395, 0.000138111412525177, 0.00014549121260643005, 0.0001528710126876831, 0.00016025081276893616, 0.0001676306128501892, 0.00017501041293144226, 0.0001823902130126953]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 10.0, 14.0, 28.0, 31.0, 51.0, 111.0, 181.0, 335.0, 738.0, 1802.0, 5877.0, 25980.0, 168766.0, 663766.0, 149340.0, 22999.0, 5312.0, 1729.0, 682.0, 352.0, 182.0, 102.0, 43.0, 44.0, 21.0, 13.0, 11.0, 12.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0479888916015625, -1.005157470703125, -0.9623260498046875, -0.91949462890625, -0.8766632080078125, -0.833831787109375, -0.7910003662109375, -0.7481689453125, -0.7053375244140625, -0.662506103515625, -0.6196746826171875, -0.57684326171875, -0.5340118408203125, -0.491180419921875, -0.4483489990234375, -0.405517578125, -0.3626861572265625, -0.319854736328125, -0.2770233154296875, -0.23419189453125, -0.1913604736328125, -0.148529052734375, -0.1056976318359375, -0.0628662109375, -0.0200347900390625, 0.022796630859375, 0.0656280517578125, 0.10845947265625, 0.1512908935546875, 0.194122314453125, 0.2369537353515625, 0.27978515625, 0.3226165771484375, 0.365447998046875, 0.4082794189453125, 0.45111083984375, 0.4939422607421875, 0.536773681640625, 0.5796051025390625, 0.6224365234375, 0.6652679443359375, 0.708099365234375, 0.7509307861328125, 0.79376220703125, 0.8365936279296875, 0.879425048828125, 0.9222564697265625, 0.965087890625, 1.0079193115234375, 1.050750732421875, 1.0935821533203125, 1.13641357421875, 1.1792449951171875, 1.222076416015625, 1.2649078369140625, 1.3077392578125, 1.3505706787109375, 1.393402099609375, 1.4362335205078125, 1.47906494140625, 1.5218963623046875, 1.564727783203125, 1.6075592041015625, 1.650390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 16.0, 1.0, 12.0, 23.0, 29.0, 40.0, 59.0, 64.0, 97.0, 154.0, 145.0, 98.0, 78.0, 59.0, 50.0, 29.0, 23.0, 14.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.92205810546875, -0.8978271484375, -0.87359619140625, -0.849365234375, -0.82513427734375, -0.8009033203125, -0.77667236328125, -0.75244140625, -0.72821044921875, -0.7039794921875, -0.67974853515625, -0.655517578125, -0.63128662109375, -0.6070556640625, -0.58282470703125, -0.55859375, -0.53436279296875, -0.5101318359375, -0.48590087890625, -0.461669921875, -0.43743896484375, -0.4132080078125, -0.38897705078125, -0.36474609375, -0.34051513671875, -0.3162841796875, -0.29205322265625, -0.267822265625, -0.24359130859375, -0.2193603515625, -0.19512939453125, -0.1708984375, -0.14666748046875, -0.1224365234375, -0.09820556640625, -0.073974609375, -0.04974365234375, -0.0255126953125, -0.00128173828125, 0.02294921875, 0.04718017578125, 0.0714111328125, 0.09564208984375, 0.119873046875, 0.14410400390625, 0.1683349609375, 0.19256591796875, 0.216796875, 0.24102783203125, 0.2652587890625, 0.28948974609375, 0.313720703125, 0.33795166015625, 0.3621826171875, 0.38641357421875, 0.41064453125, 0.43487548828125, 0.4591064453125, 0.48333740234375, 0.507568359375, 0.53179931640625, 0.5560302734375, 0.58026123046875, 0.6044921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 13.0, 10.0, 22.0, 41.0, 47.0, 83.0, 103.0, 126.0, 130.0, 140.0, 94.0, 83.0, 47.0, 30.0, 22.0, 10.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.41785717010498, -10.076034545898438, -9.734212875366211, -9.392390251159668, -9.050567626953125, -8.708745956420898, -8.366923332214355, -8.025100708007812, -7.683279037475586, -7.341456890106201, -6.999634742736816, -6.657812118530273, -6.315989971160889, -5.974167823791504, -5.632345199584961, -5.290523052215576, -4.948700904846191, -4.606878757476807, -4.265056610107422, -3.923233985900879, -3.581411838531494, -3.2395896911621094, -2.8977673053741455, -2.5559449195861816, -2.214122772216797, -1.8723005056381226, -1.5304782390594482, -1.188655972480774, -0.8468337059020996, -0.5050114393234253, -0.16318917274475098, 0.1786332130432129, 0.5204553604125977, 0.862277626991272, 1.2040998935699463, 1.5459221601486206, 1.887744426727295, 2.2295665740966797, 2.5713889598846436, 2.9132113456726074, 3.255033493041992, 3.596855640411377, 3.938678026199341, 4.280500411987305, 4.6223225593566895, 4.964144706726074, 5.305967330932617, 5.647789478302002, 5.989611625671387, 6.3314337730407715, 6.673255920410156, 7.015078544616699, 7.356900691986084, 7.698722839355469, 8.040545463562012, 8.382368087768555, 8.724189758300781, 9.066012382507324, 9.40783405303955, 9.749656677246094, 10.09147834777832, 10.433300971984863, 10.775123596191406, 11.116945266723633, 11.458767890930176]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 9.0, 8.0, 10.0, 7.0, 11.0, 22.0, 20.0, 25.0, 21.0, 30.0, 28.0, 42.0, 41.0, 41.0, 59.0, 38.0, 54.0, 37.0, 59.0, 47.0, 49.0, 35.0, 41.0, 28.0, 34.0, 36.0, 18.0, 33.0, 16.0, 19.0, 16.0, 12.0, 16.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-11.993329048156738, -11.681588172912598, -11.369847297668457, -11.058106422424316, -10.746365547180176, -10.434624671936035, -10.122883796691895, -9.811142921447754, -9.499402046203613, -9.187661170959473, -8.875920295715332, -8.564179420471191, -8.25243854522705, -7.94069766998291, -7.6289567947387695, -7.317215919494629, -7.005475044250488, -6.693734169006348, -6.381993293762207, -6.070252418518066, -5.758511543273926, -5.446770668029785, -5.1350297927856445, -4.823288917541504, -4.511548042297363, -4.199807167053223, -3.888066291809082, -3.5763254165649414, -3.264584541320801, -2.95284366607666, -2.6411027908325195, -2.329361915588379, -2.0176210403442383, -1.7058801651000977, -1.394139289855957, -1.0823984146118164, -0.7706575393676758, -0.45891666412353516, -0.14717578887939453, 0.1645650863647461, 0.4763059616088867, 0.7880468368530273, 1.099787712097168, 1.4115285873413086, 1.7232694625854492, 2.03501033782959, 2.3467512130737305, 2.658492088317871, 2.9702329635620117, 3.2819738388061523, 3.593714714050293, 3.9054555892944336, 4.217196464538574, 4.528937339782715, 4.8406782150268555, 5.152419090270996, 5.464159965515137, 5.775900840759277, 6.087641716003418, 6.399382591247559, 6.711123466491699, 7.02286434173584, 7.3346052169799805, 7.646346092224121, 7.958086967468262]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 8.0, 11.0, 12.0, 15.0, 26.0, 31.0, 33.0, 48.0, 73.0, 126.0, 205.0, 347.0, 673.0, 1603.0, 4264.0, 16446.0, 142702.0, 3569547.0, 419988.0, 27313.0, 6744.0, 2101.0, 805.0, 467.0, 227.0, 126.0, 87.0, 72.0, 46.0, 35.0, 20.0, 19.0, 12.0, 12.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.828125, -8.59356689453125, -8.3590087890625, -8.12445068359375, -7.889892578125, -7.65533447265625, -7.4207763671875, -7.18621826171875, -6.95166015625, -6.71710205078125, -6.4825439453125, -6.24798583984375, -6.013427734375, -5.77886962890625, -5.5443115234375, -5.30975341796875, -5.0751953125, -4.84063720703125, -4.6060791015625, -4.37152099609375, -4.136962890625, -3.90240478515625, -3.6678466796875, -3.43328857421875, -3.19873046875, -2.96417236328125, -2.7296142578125, -2.49505615234375, -2.260498046875, -2.02593994140625, -1.7913818359375, -1.55682373046875, -1.322265625, -1.08770751953125, -0.8531494140625, -0.61859130859375, -0.384033203125, -0.14947509765625, 0.0850830078125, 0.31964111328125, 0.55419921875, 0.78875732421875, 1.0233154296875, 1.25787353515625, 1.492431640625, 1.72698974609375, 1.9615478515625, 2.19610595703125, 2.4306640625, 2.66522216796875, 2.8997802734375, 3.13433837890625, 3.368896484375, 3.60345458984375, 3.8380126953125, 4.07257080078125, 4.30712890625, 4.54168701171875, 4.7762451171875, 5.01080322265625, 5.245361328125, 5.47991943359375, 5.7144775390625, 5.94903564453125, 6.18359375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 11.0, 26.0, 28.0, 44.0, 58.0, 64.0, 77.0, 66.0, 113.0, 92.0, 83.0, 72.0, 69.0, 58.0, 44.0, 29.0, 21.0, 15.0, 6.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.096405029296875, -4.96234130859375, -4.828277587890625, -4.6942138671875, -4.560150146484375, -4.42608642578125, -4.292022705078125, -4.157958984375, -4.023895263671875, -3.88983154296875, -3.755767822265625, -3.6217041015625, -3.487640380859375, -3.35357666015625, -3.219512939453125, -3.08544921875, -2.951385498046875, -2.81732177734375, -2.683258056640625, -2.5491943359375, -2.415130615234375, -2.28106689453125, -2.147003173828125, -2.012939453125, -1.878875732421875, -1.74481201171875, -1.610748291015625, -1.4766845703125, -1.342620849609375, -1.20855712890625, -1.074493408203125, -0.9404296875, -0.806365966796875, -0.67230224609375, -0.538238525390625, -0.4041748046875, -0.270111083984375, -0.13604736328125, -0.001983642578125, 0.132080078125, 0.266143798828125, 0.40020751953125, 0.534271240234375, 0.6683349609375, 0.802398681640625, 0.93646240234375, 1.070526123046875, 1.20458984375, 1.338653564453125, 1.47271728515625, 1.606781005859375, 1.7408447265625, 1.874908447265625, 2.00897216796875, 2.143035888671875, 2.277099609375, 2.411163330078125, 2.54522705078125, 2.679290771484375, 2.8133544921875, 2.947418212890625, 3.08148193359375, 3.215545654296875, 3.349609375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 21.0, 33.0, 44.0, 68.0, 139.0, 339.0, 1126.0, 6032.0, 133551.0, 3983977.0, 63343.0, 4159.0, 796.0, 325.0, 110.0, 65.0, 37.0, 24.0, 15.0, 12.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.203125, -10.834716796875, -10.46630859375, -10.097900390625, -9.7294921875, -9.361083984375, -8.99267578125, -8.624267578125, -8.255859375, -7.887451171875, -7.51904296875, -7.150634765625, -6.7822265625, -6.413818359375, -6.04541015625, -5.677001953125, -5.30859375, -4.940185546875, -4.57177734375, -4.203369140625, -3.8349609375, -3.466552734375, -3.09814453125, -2.729736328125, -2.361328125, -1.992919921875, -1.62451171875, -1.256103515625, -0.8876953125, -0.519287109375, -0.15087890625, 0.217529296875, 0.5859375, 0.954345703125, 1.32275390625, 1.691162109375, 2.0595703125, 2.427978515625, 2.79638671875, 3.164794921875, 3.533203125, 3.901611328125, 4.27001953125, 4.638427734375, 5.0068359375, 5.375244140625, 5.74365234375, 6.112060546875, 6.48046875, 6.848876953125, 7.21728515625, 7.585693359375, 7.9541015625, 8.322509765625, 8.69091796875, 9.059326171875, 9.427734375, 9.796142578125, 10.16455078125, 10.532958984375, 10.9013671875, 11.269775390625, 11.63818359375, 12.006591796875, 12.375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 8.0, 15.0, 23.0, 38.0, 61.0, 78.0, 150.0, 245.0, 428.0, 736.0, 801.0, 655.0, 317.0, 193.0, 119.0, 58.0, 48.0, 22.0, 19.0, 12.0, 7.0, 9.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.985260009765625, -1.92559814453125, -1.865936279296875, -1.8062744140625, -1.746612548828125, -1.68695068359375, -1.627288818359375, -1.567626953125, -1.507965087890625, -1.44830322265625, -1.388641357421875, -1.3289794921875, -1.269317626953125, -1.20965576171875, -1.149993896484375, -1.09033203125, -1.030670166015625, -0.97100830078125, -0.911346435546875, -0.8516845703125, -0.792022705078125, -0.73236083984375, -0.672698974609375, -0.613037109375, -0.553375244140625, -0.49371337890625, -0.434051513671875, -0.3743896484375, -0.314727783203125, -0.25506591796875, -0.195404052734375, -0.1357421875, -0.076080322265625, -0.01641845703125, 0.043243408203125, 0.1029052734375, 0.162567138671875, 0.22222900390625, 0.281890869140625, 0.341552734375, 0.401214599609375, 0.46087646484375, 0.520538330078125, 0.5802001953125, 0.639862060546875, 0.69952392578125, 0.759185791015625, 0.81884765625, 0.878509521484375, 0.93817138671875, 0.997833251953125, 1.0574951171875, 1.117156982421875, 1.17681884765625, 1.236480712890625, 1.296142578125, 1.355804443359375, 1.41546630859375, 1.475128173828125, 1.5347900390625, 1.594451904296875, 1.65411376953125, 1.713775634765625, 1.7734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 11.0, 19.0, 26.0, 41.0, 55.0, 59.0, 63.0, 81.0, 84.0, 97.0, 89.0, 71.0, 62.0, 44.0, 49.0, 33.0, 19.0, 32.0, 20.0, 6.0, 11.0, 10.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8258464336395264, -2.6834685802459717, -2.541090965270996, -2.3987131118774414, -2.256335496902466, -2.113957643508911, -1.971579909324646, -1.8292021751403809, -1.6868244409561157, -1.5444467067718506, -1.4020689725875854, -1.2596912384033203, -1.1173133850097656, -0.9749357104301453, -0.8325579166412354, -0.6901801824569702, -0.5478024482727051, -0.40542471408843994, -0.2630469501018524, -0.12066918611526489, 0.021708548069000244, 0.16408628225326538, 0.3064640760421753, 0.44884181022644043, 0.5912195444107056, 0.7335972785949707, 0.8759750127792358, 1.018352746963501, 1.1607306003570557, 1.3031082153320312, 1.445486068725586, 1.587863802909851, 1.730241298675537, 1.8726190328598022, 2.0149967670440674, 2.157374620437622, 2.2997522354125977, 2.4421300888061523, 2.584507942199707, 2.7268855571746826, 2.869263172149658, 3.011641025543213, 3.1540186405181885, 3.296396493911743, 3.4387741088867188, 3.5811519622802734, 3.723529815673828, 3.8659074306488037, 4.0082855224609375, 4.150663375854492, 4.293041229248047, 4.435418605804443, 4.577796459197998, 4.720174312591553, 4.862552165985107, 5.004929542541504, 5.147307395935059, 5.289685249328613, 5.432063102722168, 5.5744404792785645, 5.716818332672119, 5.859196186065674, 6.0015740394592285, 6.143951416015625, 6.28632926940918]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 1.0, 5.0, 6.0, 8.0, 5.0, 15.0, 16.0, 14.0, 24.0, 24.0, 31.0, 19.0, 27.0, 40.0, 42.0, 47.0, 54.0, 41.0, 43.0, 42.0, 44.0, 29.0, 50.0, 50.0, 43.0, 47.0, 36.0, 26.0, 37.0, 24.0, 22.0, 13.0, 15.0, 19.0, 8.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8028488159179688, -2.707266330718994, -2.6116836071014404, -2.5161008834838867, -2.420518398284912, -2.3249359130859375, -2.229353189468384, -2.13377046585083, -2.0381879806518555, -1.9426053762435913, -1.8470227718353271, -1.751440167427063, -1.6558575630187988, -1.5602749586105347, -1.4646923542022705, -1.3691097497940063, -1.2735271453857422, -1.177944540977478, -1.0823619365692139, -0.9867793321609497, -0.8911967277526855, -0.7956141233444214, -0.7000315189361572, -0.6044489145278931, -0.5088663101196289, -0.41328370571136475, -0.3177011013031006, -0.22211849689483643, -0.12653589248657227, -0.030953288078308105, 0.06462931632995605, 0.16021192073822021, 0.2557945251464844, 0.35137712955474854, 0.4469597339630127, 0.5425423383712769, 0.638124942779541, 0.7337075471878052, 0.8292901515960693, 0.9248727560043335, 1.0204553604125977, 1.1160379648208618, 1.211620569229126, 1.3072031736373901, 1.4027857780456543, 1.4983683824539185, 1.5939509868621826, 1.6895335912704468, 1.785116195678711, 1.880698800086975, 1.9762814044952393, 2.071864128112793, 2.1674466133117676, 2.263029098510742, 2.358611822128296, 2.4541945457458496, 2.549777030944824, 2.645359516143799, 2.7409422397613525, 2.8365249633789062, 2.932107448577881, 3.0276899337768555, 3.123272657394409, 3.218855381011963, 3.3144378662109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 15.0, 12.0, 18.0, 46.0, 58.0, 77.0, 125.0, 167.0, 264.0, 407.0, 706.0, 1193.0, 2207.0, 4014.0, 8242.0, 20164.0, 75075.0, 355398.0, 434058.0, 101656.0, 24751.0, 9379.0, 4552.0, 2496.0, 1369.0, 787.0, 458.0, 308.0, 178.0, 105.0, 70.0, 51.0, 35.0, 26.0, 21.0, 12.0, 9.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0703125, -1.0379714965820312, -1.0056304931640625, -0.9732894897460938, -0.940948486328125, -0.9086074829101562, -0.8762664794921875, -0.8439254760742188, -0.81158447265625, -0.7792434692382812, -0.7469024658203125, -0.7145614624023438, -0.682220458984375, -0.6498794555664062, -0.6175384521484375, -0.5851974487304688, -0.5528564453125, -0.5205154418945312, -0.4881744384765625, -0.45583343505859375, -0.423492431640625, -0.39115142822265625, -0.3588104248046875, -0.32646942138671875, -0.29412841796875, -0.26178741455078125, -0.2294464111328125, -0.19710540771484375, -0.164764404296875, -0.13242340087890625, -0.1000823974609375, -0.06774139404296875, -0.035400390625, -0.00305938720703125, 0.0292816162109375, 0.06162261962890625, 0.093963623046875, 0.12630462646484375, 0.1586456298828125, 0.19098663330078125, 0.22332763671875, 0.25566864013671875, 0.2880096435546875, 0.32035064697265625, 0.352691650390625, 0.38503265380859375, 0.4173736572265625, 0.44971466064453125, 0.4820556640625, 0.5143966674804688, 0.5467376708984375, 0.5790786743164062, 0.611419677734375, 0.6437606811523438, 0.6761016845703125, 0.7084426879882812, 0.74078369140625, 0.7731246948242188, 0.8054656982421875, 0.8378067016601562, 0.870147705078125, 0.9024887084960938, 0.9348297119140625, 0.9671707153320312, 0.99951171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 9.0, 4.0, 8.0, 14.0, 13.0, 19.0, 19.0, 25.0, 28.0, 23.0, 34.0, 36.0, 47.0, 46.0, 52.0, 56.0, 43.0, 50.0, 37.0, 50.0, 54.0, 44.0, 32.0, 39.0, 41.0, 25.0, 30.0, 19.0, 17.0, 15.0, 21.0, 11.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.96484375, -1.902099609375, -1.83935546875, -1.776611328125, -1.7138671875, -1.651123046875, -1.58837890625, -1.525634765625, -1.462890625, -1.400146484375, -1.33740234375, -1.274658203125, -1.2119140625, -1.149169921875, -1.08642578125, -1.023681640625, -0.9609375, -0.898193359375, -0.83544921875, -0.772705078125, -0.7099609375, -0.647216796875, -0.58447265625, -0.521728515625, -0.458984375, -0.396240234375, -0.33349609375, -0.270751953125, -0.2080078125, -0.145263671875, -0.08251953125, -0.019775390625, 0.04296875, 0.105712890625, 0.16845703125, 0.231201171875, 0.2939453125, 0.356689453125, 0.41943359375, 0.482177734375, 0.544921875, 0.607666015625, 0.67041015625, 0.733154296875, 0.7958984375, 0.858642578125, 0.92138671875, 0.984130859375, 1.046875, 1.109619140625, 1.17236328125, 1.235107421875, 1.2978515625, 1.360595703125, 1.42333984375, 1.486083984375, 1.548828125, 1.611572265625, 1.67431640625, 1.737060546875, 1.7998046875, 1.862548828125, 1.92529296875, 1.988037109375, 2.05078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 10.0, 7.0, 21.0, 19.0, 39.0, 71.0, 110.0, 191.0, 422.0, 835.0, 1961.0, 5555.0, 19679.0, 147287.0, 694384.0, 148331.0, 20322.0, 5537.0, 1974.0, 829.0, 448.0, 222.0, 93.0, 64.0, 43.0, 18.0, 11.0, 10.0, 5.0, 7.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.6845703125, -1.637115478515625, -1.58966064453125, -1.542205810546875, -1.4947509765625, -1.447296142578125, -1.39984130859375, -1.352386474609375, -1.304931640625, -1.257476806640625, -1.21002197265625, -1.162567138671875, -1.1151123046875, -1.067657470703125, -1.02020263671875, -0.972747802734375, -0.92529296875, -0.877838134765625, -0.83038330078125, -0.782928466796875, -0.7354736328125, -0.688018798828125, -0.64056396484375, -0.593109130859375, -0.545654296875, -0.498199462890625, -0.45074462890625, -0.403289794921875, -0.3558349609375, -0.308380126953125, -0.26092529296875, -0.213470458984375, -0.166015625, -0.118560791015625, -0.07110595703125, -0.023651123046875, 0.0238037109375, 0.071258544921875, 0.11871337890625, 0.166168212890625, 0.213623046875, 0.261077880859375, 0.30853271484375, 0.355987548828125, 0.4034423828125, 0.450897216796875, 0.49835205078125, 0.545806884765625, 0.59326171875, 0.640716552734375, 0.68817138671875, 0.735626220703125, 0.7830810546875, 0.830535888671875, 0.87799072265625, 0.925445556640625, 0.972900390625, 1.020355224609375, 1.06781005859375, 1.115264892578125, 1.1627197265625, 1.210174560546875, 1.25762939453125, 1.305084228515625, 1.3525390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 7.0, 8.0, 6.0, 8.0, 12.0, 22.0, 18.0, 26.0, 20.0, 14.0, 34.0, 37.0, 40.0, 36.0, 49.0, 50.0, 39.0, 46.0, 45.0, 52.0, 53.0, 53.0, 40.0, 37.0, 43.0, 27.0, 30.0, 31.0, 16.0, 15.0, 13.0, 12.0, 11.0, 5.0, 6.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.921875, -4.77215576171875, -4.6224365234375, -4.47271728515625, -4.322998046875, -4.17327880859375, -4.0235595703125, -3.87384033203125, -3.72412109375, -3.57440185546875, -3.4246826171875, -3.27496337890625, -3.125244140625, -2.97552490234375, -2.8258056640625, -2.67608642578125, -2.5263671875, -2.37664794921875, -2.2269287109375, -2.07720947265625, -1.927490234375, -1.77777099609375, -1.6280517578125, -1.47833251953125, -1.32861328125, -1.17889404296875, -1.0291748046875, -0.87945556640625, -0.729736328125, -0.58001708984375, -0.4302978515625, -0.28057861328125, -0.130859375, 0.01885986328125, 0.1685791015625, 0.31829833984375, 0.468017578125, 0.61773681640625, 0.7674560546875, 0.91717529296875, 1.06689453125, 1.21661376953125, 1.3663330078125, 1.51605224609375, 1.665771484375, 1.81549072265625, 1.9652099609375, 2.11492919921875, 2.2646484375, 2.41436767578125, 2.5640869140625, 2.71380615234375, 2.863525390625, 3.01324462890625, 3.1629638671875, 3.31268310546875, 3.46240234375, 3.61212158203125, 3.7618408203125, 3.91156005859375, 4.061279296875, 4.21099853515625, 4.3607177734375, 4.51043701171875, 4.66015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 13.0, 12.0, 45.0, 71.0, 141.0, 343.0, 794.0, 2727.0, 13122.0, 274261.0, 722880.0, 27859.0, 4250.0, 1211.0, 440.0, 194.0, 82.0, 47.0, 32.0, 16.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5498046875, -1.5081024169921875, -1.466400146484375, -1.4246978759765625, -1.38299560546875, -1.3412933349609375, -1.299591064453125, -1.2578887939453125, -1.2161865234375, -1.1744842529296875, -1.132781982421875, -1.0910797119140625, -1.04937744140625, -1.0076751708984375, -0.965972900390625, -0.9242706298828125, -0.882568359375, -0.8408660888671875, -0.799163818359375, -0.7574615478515625, -0.71575927734375, -0.6740570068359375, -0.632354736328125, -0.5906524658203125, -0.5489501953125, -0.5072479248046875, -0.465545654296875, -0.4238433837890625, -0.38214111328125, -0.3404388427734375, -0.298736572265625, -0.2570343017578125, -0.21533203125, -0.1736297607421875, -0.131927490234375, -0.0902252197265625, -0.04852294921875, -0.0068206787109375, 0.034881591796875, 0.0765838623046875, 0.1182861328125, 0.1599884033203125, 0.201690673828125, 0.2433929443359375, 0.28509521484375, 0.3267974853515625, 0.368499755859375, 0.4102020263671875, 0.451904296875, 0.4936065673828125, 0.535308837890625, 0.5770111083984375, 0.61871337890625, 0.6604156494140625, 0.702117919921875, 0.7438201904296875, 0.7855224609375, 0.8272247314453125, 0.868927001953125, 0.9106292724609375, 0.95233154296875, 0.9940338134765625, 1.035736083984375, 1.0774383544921875, 1.119140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 16.0, 16.0, 32.0, 48.0, 90.0, 135.0, 175.0, 152.0, 140.0, 81.0, 49.0, 22.0, 19.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005588531494140625, -0.0005445331335067749, -0.0005302131175994873, -0.0005158931016921997, -0.0005015730857849121, -0.0004872530698776245, -0.0004729330539703369, -0.0004586130380630493, -0.0004442930221557617, -0.0004299730062484741, -0.0004156529903411865, -0.0004013329744338989, -0.00038701295852661133, -0.00037269294261932373, -0.00035837292671203613, -0.00034405291080474854, -0.00032973289489746094, -0.00031541287899017334, -0.00030109286308288574, -0.00028677284717559814, -0.00027245283126831055, -0.00025813281536102295, -0.00024381279945373535, -0.00022949278354644775, -0.00021517276763916016, -0.00020085275173187256, -0.00018653273582458496, -0.00017221271991729736, -0.00015789270401000977, -0.00014357268810272217, -0.00012925267219543457, -0.00011493265628814697, -0.00010061264038085938, -8.629262447357178e-05, -7.197260856628418e-05, -5.765259265899658e-05, -4.3332576751708984e-05, -2.9012560844421387e-05, -1.4692544937133789e-05, -3.725290298461914e-07, 1.3947486877441406e-05, 2.8267502784729004e-05, 4.25875186920166e-05, 5.69075345993042e-05, 7.12275505065918e-05, 8.55475664138794e-05, 9.986758232116699e-05, 0.00011418759822845459, 0.0001285076141357422, 0.00014282763004302979, 0.00015714764595031738, 0.00017146766185760498, 0.00018578767776489258, 0.00020010769367218018, 0.00021442770957946777, 0.00022874772548675537, 0.00024306774139404297, 0.00025738775730133057, 0.00027170777320861816, 0.00028602778911590576, 0.00030034780502319336, 0.00031466782093048096, 0.00032898783683776855, 0.00034330785274505615, 0.00035762786865234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 10.0, 5.0, 12.0, 15.0, 30.0, 31.0, 43.0, 50.0, 84.0, 107.0, 172.0, 213.0, 335.0, 514.0, 799.0, 1209.0, 2164.0, 3709.0, 7454.0, 15042.0, 34700.0, 88371.0, 230465.0, 348954.0, 188121.0, 71402.0, 28118.0, 12290.0, 5907.0, 3066.0, 1813.0, 1114.0, 715.0, 483.0, 278.0, 196.0, 159.0, 95.0, 66.0, 51.0, 41.0, 37.0, 29.0, 23.0, 12.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0], "bins": [-0.38232421875, -0.37087249755859375, -0.3594207763671875, -0.34796905517578125, -0.336517333984375, -0.32506561279296875, -0.3136138916015625, -0.30216217041015625, -0.29071044921875, -0.27925872802734375, -0.2678070068359375, -0.25635528564453125, -0.244903564453125, -0.23345184326171875, -0.2220001220703125, -0.21054840087890625, -0.1990966796875, -0.18764495849609375, -0.1761932373046875, -0.16474151611328125, -0.153289794921875, -0.14183807373046875, -0.1303863525390625, -0.11893463134765625, -0.10748291015625, -0.09603118896484375, -0.0845794677734375, -0.07312774658203125, -0.061676025390625, -0.05022430419921875, -0.0387725830078125, -0.02732086181640625, -0.015869140625, -0.00441741943359375, 0.0070343017578125, 0.01848602294921875, 0.029937744140625, 0.04138946533203125, 0.0528411865234375, 0.06429290771484375, 0.07574462890625, 0.08719635009765625, 0.0986480712890625, 0.11009979248046875, 0.121551513671875, 0.13300323486328125, 0.1444549560546875, 0.15590667724609375, 0.1673583984375, 0.17881011962890625, 0.1902618408203125, 0.20171356201171875, 0.213165283203125, 0.22461700439453125, 0.2360687255859375, 0.24752044677734375, 0.25897216796875, 0.27042388916015625, 0.2818756103515625, 0.29332733154296875, 0.304779052734375, 0.31623077392578125, 0.3276824951171875, 0.33913421630859375, 0.3505859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 7.0, 4.0, 16.0, 21.0, 22.0, 33.0, 44.0, 64.0, 78.0, 88.0, 101.0, 116.0, 107.0, 68.0, 70.0, 38.0, 36.0, 23.0, 14.0, 11.0, 10.0, 4.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185546875, -0.1793537139892578, -0.17316055297851562, -0.16696739196777344, -0.16077423095703125, -0.15458106994628906, -0.14838790893554688, -0.1421947479248047, -0.1360015869140625, -0.1298084259033203, -0.12361526489257812, -0.11742210388183594, -0.11122894287109375, -0.10503578186035156, -0.09884262084960938, -0.09264945983886719, -0.086456298828125, -0.08026313781738281, -0.07406997680664062, -0.06787681579589844, -0.06168365478515625, -0.05549049377441406, -0.049297332763671875, -0.04310417175292969, -0.0369110107421875, -0.030717849731445312, -0.024524688720703125, -0.018331527709960938, -0.01213836669921875, -0.0059452056884765625, 0.000247955322265625, 0.0064411163330078125, 0.01263427734375, 0.018827438354492188, 0.025020599365234375, 0.031213760375976562, 0.03740692138671875, 0.04360008239746094, 0.049793243408203125, 0.05598640441894531, 0.0621795654296875, 0.06837272644042969, 0.07456588745117188, 0.08075904846191406, 0.08695220947265625, 0.09314537048339844, 0.09933853149414062, 0.10553169250488281, 0.111724853515625, 0.11791801452636719, 0.12411117553710938, 0.13030433654785156, 0.13649749755859375, 0.14269065856933594, 0.14888381958007812, 0.1550769805908203, 0.1612701416015625, 0.1674633026123047, 0.17365646362304688, 0.17984962463378906, 0.18604278564453125, 0.19223594665527344, 0.19842910766601562, 0.2046222686767578, 0.2108154296875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 9.0, 13.0, 17.0, 23.0, 38.0, 44.0, 56.0, 70.0, 85.0, 79.0, 85.0, 86.0, 83.0, 52.0, 52.0, 49.0, 30.0, 27.0, 18.0, 16.0, 17.0, 5.0, 14.0, 3.0, 7.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029763698577881, -1.9478716850280762, -1.8659796714782715, -1.7840876579284668, -1.702195644378662, -1.6203036308288574, -1.5384116172790527, -1.456519603729248, -1.3746275901794434, -1.2927355766296387, -1.210843563079834, -1.1289515495300293, -1.0470595359802246, -0.9651675224304199, -0.8832755088806152, -0.8013834953308105, -0.7194914817810059, -0.6375994682312012, -0.5557074546813965, -0.4738154411315918, -0.3919234275817871, -0.3100314140319824, -0.22813940048217773, -0.14624738693237305, -0.06435537338256836, 0.017536640167236328, 0.09942865371704102, 0.1813206672668457, 0.2632126808166504, 0.3451046943664551, 0.42699670791625977, 0.5088887214660645, 0.5907809734344482, 0.6726729869842529, 0.7545650005340576, 0.8364570140838623, 0.918349027633667, 1.0002410411834717, 1.0821330547332764, 1.164025068283081, 1.2459170818328857, 1.3278090953826904, 1.4097011089324951, 1.4915931224822998, 1.5734851360321045, 1.6553771495819092, 1.7372691631317139, 1.8191611766815186, 1.9010531902313232, 1.982945203781128, 2.0648372173309326, 2.1467292308807373, 2.228621244430542, 2.3105132579803467, 2.3924052715301514, 2.474297285079956, 2.5561892986297607, 2.6380813121795654, 2.71997332572937, 2.801865339279175, 2.8837573528289795, 2.965649366378784, 3.047541379928589, 3.1294333934783936, 3.2113254070281982]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 8.0, 5.0, 7.0, 10.0, 10.0, 22.0, 18.0, 21.0, 27.0, 30.0, 21.0, 35.0, 42.0, 45.0, 38.0, 44.0, 38.0, 42.0, 52.0, 28.0, 40.0, 52.0, 38.0, 33.0, 32.0, 44.0, 28.0, 23.0, 31.0, 28.0, 11.0, 22.0, 13.0, 6.0, 11.0, 8.0, 7.0, 8.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5782090425491333, -1.5229995250701904, -1.4677900075912476, -1.4125804901123047, -1.3573710918426514, -1.3021615743637085, -1.2469520568847656, -1.1917425394058228, -1.1365330219268799, -1.081323504447937, -1.0261139869689941, -0.970904529094696, -0.915695071220398, -0.8604855537414551, -0.8052760362625122, -0.7500665187835693, -0.694857120513916, -0.6396476030349731, -0.584438145160675, -0.5292286276817322, -0.4740191400051117, -0.4188096523284912, -0.36360013484954834, -0.30839064717292786, -0.2531811594963074, -0.1979716718196869, -0.1427621692419052, -0.08755266666412354, -0.03234317898750305, 0.02286630868911743, 0.0780758261680603, 0.1332853138446808, 0.18849468231201172, 0.2437041699886322, 0.2989136576652527, 0.35412317514419556, 0.40933266282081604, 0.4645421504974365, 0.5197516679763794, 0.5749611854553223, 0.6301706433296204, 0.6853801608085632, 0.7405896186828613, 0.7957991361618042, 0.8510086536407471, 0.9062181115150452, 0.961427628993988, 1.0166370868682861, 1.071846604347229, 1.1270561218261719, 1.1822656393051147, 1.2374751567840576, 1.292684555053711, 1.3478940725326538, 1.4031035900115967, 1.4583131074905396, 1.5135226249694824, 1.5687321424484253, 1.6239416599273682, 1.6791510581970215, 1.7343605756759644, 1.7895700931549072, 1.84477961063385, 1.899989128112793, 1.9551985263824463]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 7.0, 12.0, 20.0, 34.0, 42.0, 54.0, 86.0, 138.0, 200.0, 369.0, 699.0, 1316.0, 2670.0, 5867.0, 13411.0, 32577.0, 87471.0, 294361.0, 413303.0, 120741.0, 43414.0, 17387.0, 7486.0, 3325.0, 1635.0, 812.0, 442.0, 221.0, 134.0, 97.0, 67.0, 34.0, 34.0, 10.0, 21.0, 6.0, 8.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.875946044921875, -2.77728271484375, -2.678619384765625, -2.5799560546875, -2.481292724609375, -2.38262939453125, -2.283966064453125, -2.185302734375, -2.086639404296875, -1.98797607421875, -1.889312744140625, -1.7906494140625, -1.691986083984375, -1.59332275390625, -1.494659423828125, -1.39599609375, -1.297332763671875, -1.19866943359375, -1.100006103515625, -1.0013427734375, -0.902679443359375, -0.80401611328125, -0.705352783203125, -0.606689453125, -0.508026123046875, -0.40936279296875, -0.310699462890625, -0.2120361328125, -0.113372802734375, -0.01470947265625, 0.083953857421875, 0.1826171875, 0.281280517578125, 0.37994384765625, 0.478607177734375, 0.5772705078125, 0.675933837890625, 0.77459716796875, 0.873260498046875, 0.971923828125, 1.070587158203125, 1.16925048828125, 1.267913818359375, 1.3665771484375, 1.465240478515625, 1.56390380859375, 1.662567138671875, 1.76123046875, 1.859893798828125, 1.95855712890625, 2.057220458984375, 2.1558837890625, 2.254547119140625, 2.35321044921875, 2.451873779296875, 2.550537109375, 2.649200439453125, 2.74786376953125, 2.846527099609375, 2.9451904296875, 3.043853759765625, 3.14251708984375, 3.241180419921875, 3.33984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 1.0, 5.0, 4.0, 5.0, 10.0, 11.0, 8.0, 15.0, 22.0, 13.0, 26.0, 25.0, 43.0, 31.0, 25.0, 40.0, 39.0, 46.0, 44.0, 50.0, 43.0, 42.0, 45.0, 40.0, 39.0, 36.0, 36.0, 32.0, 31.0, 26.0, 29.0, 29.0, 22.0, 15.0, 16.0, 18.0, 3.0, 7.0, 10.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.072265625, -2.97308349609375, -2.8739013671875, -2.77471923828125, -2.675537109375, -2.57635498046875, -2.4771728515625, -2.37799072265625, -2.27880859375, -2.17962646484375, -2.0804443359375, -1.98126220703125, -1.882080078125, -1.78289794921875, -1.6837158203125, -1.58453369140625, -1.4853515625, -1.38616943359375, -1.2869873046875, -1.18780517578125, -1.088623046875, -0.98944091796875, -0.8902587890625, -0.79107666015625, -0.69189453125, -0.59271240234375, -0.4935302734375, -0.39434814453125, -0.295166015625, -0.19598388671875, -0.0968017578125, 0.00238037109375, 0.1015625, 0.20074462890625, 0.2999267578125, 0.39910888671875, 0.498291015625, 0.59747314453125, 0.6966552734375, 0.79583740234375, 0.89501953125, 0.99420166015625, 1.0933837890625, 1.19256591796875, 1.291748046875, 1.39093017578125, 1.4901123046875, 1.58929443359375, 1.6884765625, 1.78765869140625, 1.8868408203125, 1.98602294921875, 2.085205078125, 2.18438720703125, 2.2835693359375, 2.38275146484375, 2.48193359375, 2.58111572265625, 2.6802978515625, 2.77947998046875, 2.878662109375, 2.97784423828125, 3.0770263671875, 3.17620849609375, 3.275390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 7.0, 15.0, 24.0, 28.0, 29.0, 48.0, 86.0, 110.0, 187.0, 315.0, 608.0, 1382.0, 3259.0, 8458.0, 23785.0, 74124.0, 286278.0, 466461.0, 124995.0, 36844.0, 12853.0, 4798.0, 1902.0, 853.0, 399.0, 244.0, 153.0, 75.0, 66.0, 41.0, 25.0, 22.0, 15.0, 13.0, 9.0, 11.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.689453125, -3.57489013671875, -3.4603271484375, -3.34576416015625, -3.231201171875, -3.11663818359375, -3.0020751953125, -2.88751220703125, -2.77294921875, -2.65838623046875, -2.5438232421875, -2.42926025390625, -2.314697265625, -2.20013427734375, -2.0855712890625, -1.97100830078125, -1.8564453125, -1.74188232421875, -1.6273193359375, -1.51275634765625, -1.398193359375, -1.28363037109375, -1.1690673828125, -1.05450439453125, -0.93994140625, -0.82537841796875, -0.7108154296875, -0.59625244140625, -0.481689453125, -0.36712646484375, -0.2525634765625, -0.13800048828125, -0.0234375, 0.09112548828125, 0.2056884765625, 0.32025146484375, 0.434814453125, 0.54937744140625, 0.6639404296875, 0.77850341796875, 0.89306640625, 1.00762939453125, 1.1221923828125, 1.23675537109375, 1.351318359375, 1.46588134765625, 1.5804443359375, 1.69500732421875, 1.8095703125, 1.92413330078125, 2.0386962890625, 2.15325927734375, 2.267822265625, 2.38238525390625, 2.4969482421875, 2.61151123046875, 2.72607421875, 2.84063720703125, 2.9552001953125, 3.06976318359375, 3.184326171875, 3.29888916015625, 3.4134521484375, 3.52801513671875, 3.642578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 10.0, 11.0, 16.0, 9.0, 23.0, 20.0, 31.0, 28.0, 28.0, 45.0, 38.0, 39.0, 53.0, 36.0, 63.0, 57.0, 52.0, 48.0, 46.0, 45.0, 36.0, 43.0, 44.0, 24.0, 25.0, 16.0, 15.0, 14.0, 15.0, 8.0, 7.0, 11.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.52734375, -4.39605712890625, -4.2647705078125, -4.13348388671875, -4.002197265625, -3.87091064453125, -3.7396240234375, -3.60833740234375, -3.47705078125, -3.34576416015625, -3.2144775390625, -3.08319091796875, -2.951904296875, -2.82061767578125, -2.6893310546875, -2.55804443359375, -2.4267578125, -2.29547119140625, -2.1641845703125, -2.03289794921875, -1.901611328125, -1.77032470703125, -1.6390380859375, -1.50775146484375, -1.37646484375, -1.24517822265625, -1.1138916015625, -0.98260498046875, -0.851318359375, -0.72003173828125, -0.5887451171875, -0.45745849609375, -0.326171875, -0.19488525390625, -0.0635986328125, 0.06768798828125, 0.198974609375, 0.33026123046875, 0.4615478515625, 0.59283447265625, 0.72412109375, 0.85540771484375, 0.9866943359375, 1.11798095703125, 1.249267578125, 1.38055419921875, 1.5118408203125, 1.64312744140625, 1.7744140625, 1.90570068359375, 2.0369873046875, 2.16827392578125, 2.299560546875, 2.43084716796875, 2.5621337890625, 2.69342041015625, 2.82470703125, 2.95599365234375, 3.0872802734375, 3.21856689453125, 3.349853515625, 3.48114013671875, 3.6124267578125, 3.74371337890625, 3.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 21.0, 24.0, 30.0, 51.0, 68.0, 102.0, 145.0, 247.0, 362.0, 668.0, 1035.0, 1972.0, 3808.0, 7417.0, 14932.0, 32873.0, 81396.0, 221369.0, 406505.0, 163429.0, 61023.0, 25852.0, 12088.0, 6050.0, 3123.0, 1600.0, 915.0, 516.0, 291.0, 205.0, 132.0, 73.0, 66.0, 39.0, 33.0, 19.0, 13.0, 16.0, 3.0, 5.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5044174194335938, -0.4883270263671875, -0.47223663330078125, -0.456146240234375, -0.44005584716796875, -0.4239654541015625, -0.40787506103515625, -0.39178466796875, -0.37569427490234375, -0.3596038818359375, -0.34351348876953125, -0.327423095703125, -0.31133270263671875, -0.2952423095703125, -0.27915191650390625, -0.2630615234375, -0.24697113037109375, -0.2308807373046875, -0.21479034423828125, -0.198699951171875, -0.18260955810546875, -0.1665191650390625, -0.15042877197265625, -0.13433837890625, -0.11824798583984375, -0.1021575927734375, -0.08606719970703125, -0.069976806640625, -0.05388641357421875, -0.0377960205078125, -0.02170562744140625, -0.005615234375, 0.01047515869140625, 0.0265655517578125, 0.04265594482421875, 0.058746337890625, 0.07483673095703125, 0.0909271240234375, 0.10701751708984375, 0.12310791015625, 0.13919830322265625, 0.1552886962890625, 0.17137908935546875, 0.187469482421875, 0.20355987548828125, 0.2196502685546875, 0.23574066162109375, 0.2518310546875, 0.26792144775390625, 0.2840118408203125, 0.30010223388671875, 0.316192626953125, 0.33228302001953125, 0.3483734130859375, 0.36446380615234375, 0.38055419921875, 0.39664459228515625, 0.4127349853515625, 0.42882537841796875, 0.444915771484375, 0.46100616455078125, 0.4770965576171875, 0.49318695068359375, 0.50927734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 16.0, 12.0, 21.0, 24.0, 38.0, 38.0, 47.0, 54.0, 62.0, 89.0, 93.0, 91.0, 61.0, 61.0, 50.0, 40.0, 38.0, 31.0, 20.0, 18.0, 16.0, 7.0, 10.0, 5.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00014019012451171875, -0.0001363418996334076, -0.00013249367475509644, -0.00012864544987678528, -0.00012479722499847412, -0.00012094900012016296, -0.0001171007752418518, -0.00011325255036354065, -0.00010940432548522949, -0.00010555610060691833, -0.00010170787572860718, -9.785965085029602e-05, -9.401142597198486e-05, -9.01632010936737e-05, -8.631497621536255e-05, -8.246675133705139e-05, -7.861852645874023e-05, -7.477030158042908e-05, -7.092207670211792e-05, -6.707385182380676e-05, -6.32256269454956e-05, -5.937740206718445e-05, -5.552917718887329e-05, -5.1680952310562134e-05, -4.7832727432250977e-05, -4.398450255393982e-05, -4.013627767562866e-05, -3.6288052797317505e-05, -3.243982791900635e-05, -2.859160304069519e-05, -2.4743378162384033e-05, -2.0895153284072876e-05, -1.704692840576172e-05, -1.3198703527450562e-05, -9.350478649139404e-06, -5.502253770828247e-06, -1.6540288925170898e-06, 2.1941959857940674e-06, 6.042420864105225e-06, 9.890645742416382e-06, 1.3738870620727539e-05, 1.7587095499038696e-05, 2.1435320377349854e-05, 2.528354525566101e-05, 2.9131770133972168e-05, 3.2979995012283325e-05, 3.682821989059448e-05, 4.067644476890564e-05, 4.45246696472168e-05, 4.8372894525527954e-05, 5.222111940383911e-05, 5.606934428215027e-05, 5.9917569160461426e-05, 6.376579403877258e-05, 6.761401891708374e-05, 7.14622437953949e-05, 7.531046867370605e-05, 7.915869355201721e-05, 8.300691843032837e-05, 8.685514330863953e-05, 9.070336818695068e-05, 9.455159306526184e-05, 9.8399817943573e-05, 0.00010224804282188416, 0.00010609626770019531]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 6.0, 11.0, 9.0, 14.0, 14.0, 27.0, 31.0, 31.0, 67.0, 78.0, 111.0, 141.0, 242.0, 336.0, 528.0, 972.0, 1640.0, 2960.0, 6051.0, 13379.0, 32574.0, 91542.0, 304071.0, 404844.0, 117458.0, 39958.0, 16041.0, 7228.0, 3425.0, 1812.0, 1022.0, 626.0, 428.0, 280.0, 170.0, 115.0, 81.0, 63.0, 52.0, 24.0, 24.0, 21.0, 12.0, 11.0, 8.0, 8.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.78857421875, -0.7647552490234375, -0.740936279296875, -0.7171173095703125, -0.69329833984375, -0.6694793701171875, -0.645660400390625, -0.6218414306640625, -0.5980224609375, -0.5742034912109375, -0.550384521484375, -0.5265655517578125, -0.50274658203125, -0.4789276123046875, -0.455108642578125, -0.4312896728515625, -0.407470703125, -0.3836517333984375, -0.359832763671875, -0.3360137939453125, -0.31219482421875, -0.2883758544921875, -0.264556884765625, -0.2407379150390625, -0.2169189453125, -0.1930999755859375, -0.169281005859375, -0.1454620361328125, -0.12164306640625, -0.0978240966796875, -0.074005126953125, -0.0501861572265625, -0.0263671875, -0.0025482177734375, 0.021270751953125, 0.0450897216796875, 0.06890869140625, 0.0927276611328125, 0.116546630859375, 0.1403656005859375, 0.1641845703125, 0.1880035400390625, 0.211822509765625, 0.2356414794921875, 0.25946044921875, 0.2832794189453125, 0.307098388671875, 0.3309173583984375, 0.354736328125, 0.3785552978515625, 0.402374267578125, 0.4261932373046875, 0.45001220703125, 0.4738311767578125, 0.497650146484375, 0.5214691162109375, 0.5452880859375, 0.5691070556640625, 0.592926025390625, 0.6167449951171875, 0.64056396484375, 0.6643829345703125, 0.688201904296875, 0.7120208740234375, 0.73583984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 7.0, 15.0, 29.0, 36.0, 35.0, 55.0, 91.0, 118.0, 141.0, 119.0, 112.0, 73.0, 52.0, 20.0, 21.0, 20.0, 12.0, 5.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.75341796875, -0.7329635620117188, -0.7125091552734375, -0.6920547485351562, -0.671600341796875, -0.6511459350585938, -0.6306915283203125, -0.6102371215820312, -0.58978271484375, -0.5693283081054688, -0.5488739013671875, -0.5284194946289062, -0.507965087890625, -0.48751068115234375, -0.4670562744140625, -0.44660186767578125, -0.4261474609375, -0.40569305419921875, -0.3852386474609375, -0.36478424072265625, -0.344329833984375, -0.32387542724609375, -0.3034210205078125, -0.28296661376953125, -0.26251220703125, -0.24205780029296875, -0.2216033935546875, -0.20114898681640625, -0.180694580078125, -0.16024017333984375, -0.1397857666015625, -0.11933135986328125, -0.098876953125, -0.07842254638671875, -0.0579681396484375, -0.03751373291015625, -0.017059326171875, 0.00339508056640625, 0.0238494873046875, 0.04430389404296875, 0.06475830078125, 0.08521270751953125, 0.1056671142578125, 0.12612152099609375, 0.146575927734375, 0.16703033447265625, 0.1874847412109375, 0.20793914794921875, 0.2283935546875, 0.24884796142578125, 0.2693023681640625, 0.28975677490234375, 0.310211181640625, 0.33066558837890625, 0.3511199951171875, 0.37157440185546875, 0.39202880859375, 0.41248321533203125, 0.4329376220703125, 0.45339202880859375, 0.473846435546875, 0.49430084228515625, 0.5147552490234375, 0.5352096557617188, 0.5556640625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 19.0, 26.0, 61.0, 100.0, 151.0, 157.0, 174.0, 133.0, 75.0, 43.0, 26.0, 14.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6573333740234375, -7.322300910949707, -6.987267971038818, -6.652235507965088, -6.317202568054199, -5.982170104980469, -5.647137641906738, -5.312105178833008, -4.977072238922119, -4.642039775848389, -4.3070068359375, -3.9719743728637695, -3.63694167137146, -3.3019089698791504, -2.96687650680542, -2.6318438053131104, -2.296811103820801, -1.9617784023284912, -1.6267458200454712, -1.2917132377624512, -0.9566805362701416, -0.621647834777832, -0.28661537170410156, 0.04841732978820801, 0.3834500312805176, 0.7184826731681824, 1.0535153150558472, 1.3885478973388672, 1.7235805988311768, 2.0586133003234863, 2.393645763397217, 2.7286784648895264, 3.063711166381836, 3.3987438678741455, 3.733776569366455, 4.0688090324401855, 4.403841972351074, 4.738874435424805, 5.073906898498535, 5.408939361572266, 5.743972301483154, 6.079004764556885, 6.414037704467773, 6.749070167541504, 7.084102630615234, 7.419135570526123, 7.7541680335998535, 8.089200973510742, 8.424233436584473, 8.759265899658203, 9.094298362731934, 9.429330825805664, 9.764364242553711, 10.099396705627441, 10.434429168701172, 10.769461631774902, 11.104494094848633, 11.439526557922363, 11.774559020996094, 12.10959243774414, 12.444624900817871, 12.779657363891602, 13.114689826965332, 13.449722290039062, 13.78475570678711]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 2.0, 5.0, 5.0, 4.0, 10.0, 7.0, 16.0, 18.0, 15.0, 21.0, 26.0, 21.0, 29.0, 36.0, 28.0, 36.0, 23.0, 37.0, 39.0, 36.0, 32.0, 47.0, 37.0, 44.0, 42.0, 33.0, 27.0, 42.0, 32.0, 40.0, 27.0, 31.0, 16.0, 15.0, 27.0, 8.0, 18.0, 10.0, 11.0, 8.0, 13.0, 8.0, 2.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.685919284820557, -5.5085272789001465, -5.3311357498168945, -5.153743743896484, -4.976351737976074, -4.798959732055664, -4.621567726135254, -4.444176197052002, -4.266784191131592, -4.089392185211182, -3.9120004177093506, -3.7346086502075195, -3.5572166442871094, -3.379824638366699, -3.202432870864868, -3.025041103363037, -2.847649097442627, -2.670257091522217, -2.4928653240203857, -2.3154735565185547, -2.1380815505981445, -1.960689663887024, -1.7832977771759033, -1.6059058904647827, -1.428514003753662, -1.2511221170425415, -1.073730230331421, -0.8963383436203003, -0.7189464569091797, -0.5415545701980591, -0.3641626834869385, -0.18677079677581787, -0.009379386901855469, 0.16801249980926514, 0.34540438652038574, 0.5227962732315063, 0.700188159942627, 0.8775800466537476, 1.0549719333648682, 1.2323638200759888, 1.4097557067871094, 1.58714759349823, 1.7645394802093506, 1.9419313669204712, 2.119323253631592, 2.296715259552002, 2.474107027053833, 2.651498794555664, 2.828890800476074, 3.0062828063964844, 3.1836745738983154, 3.3610663414001465, 3.5384583473205566, 3.715850353240967, 3.893242120742798, 4.070633888244629, 4.248025894165039, 4.425417900085449, 4.602809906005859, 4.780201435089111, 4.9575934410095215, 5.134985446929932, 5.312376976013184, 5.489768981933594, 5.667160987854004]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 11.0, 13.0, 25.0, 15.0, 29.0, 38.0, 42.0, 65.0, 99.0, 81.0, 109.0, 144.0, 182.0, 226.0, 287.0, 382.0, 442.0, 549.0, 739.0, 1139.0, 1041031.0, 1250.0, 842.0, 567.0, 474.0, 383.0, 301.0, 235.0, 184.0, 165.0, 110.0, 91.0, 89.0, 66.0, 41.0, 32.0, 30.0, 17.0, 20.0, 18.0, 10.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.7618536949157715, -7.51632022857666, -7.270786285400391, -7.025252819061279, -6.779719352722168, -6.534185409545898, -6.288651943206787, -6.043118476867676, -5.7975850105285645, -5.552051544189453, -5.306517601013184, -5.060984134674072, -4.815450668334961, -4.569916725158691, -4.32438325881958, -4.078849792480469, -3.8333160877227783, -3.587782382965088, -3.3422489166259766, -3.096715211868286, -2.851181745529175, -2.6056480407714844, -2.360114574432373, -2.1145808696746826, -1.8690472841262817, -1.6235136985778809, -1.37798011302948, -1.132446527481079, -0.8869128823280334, -0.6413792371749878, -0.3958456516265869, -0.15031206607818604, 0.09522151947021484, 0.3407551050186157, 0.5862886905670166, 0.8318223357200623, 1.0773558616638184, 1.3228895664215088, 1.5684231519699097, 1.8139567375183105, 2.059490203857422, 2.3050239086151123, 2.5505573749542236, 2.796091079711914, 3.0416245460510254, 3.287158250808716, 3.5326919555664062, 3.7782254219055176, 4.023758888244629, 4.26929235458374, 4.51482629776001, 4.760359764099121, 5.005893230438232, 5.251426696777344, 5.496960639953613, 5.742494106292725, 5.988028049468994, 6.2335615158081055, 6.479095458984375, 6.724628925323486, 6.970162391662598, 7.215696334838867, 7.4612298011779785, 7.70676326751709, 7.952296733856201]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 14.0, 24.0, 51.0, 88.0, 298.0, 876.0, 2495.0, 8633.0, 51432112.0, 19684.0, 4545.0, 1590.0, 566.0, 183.0, 83.0, 33.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.9190673828125, -64.31858825683594, -61.71810531616211, -59.11762237548828, -56.51714324951172, -53.91666030883789, -51.31617736816406, -48.7156982421875, -46.11521911621094, -43.51473617553711, -40.91425704956055, -38.31377410888672, -35.713294982910156, -33.11281204223633, -30.512331008911133, -27.911849975585938, -25.31136703491211, -22.710886001586914, -20.11040496826172, -17.50992202758789, -14.909441947937012, -12.308960914611816, -9.708478927612305, -7.107997894287109, -4.507516860961914, -1.9070355892181396, 0.6934456825256348, 3.2939271926879883, 5.894408226013184, 8.494889259338379, 11.09537124633789, 13.695852279663086, 16.29633331298828, 18.896814346313477, 21.497295379638672, 24.0977783203125, 26.698257446289062, 29.29874038696289, 31.899221420288086, 34.49970245361328, 37.100181579589844, 39.70066452026367, 42.301143646240234, 44.90162658691406, 47.502105712890625, 50.10258865356445, 52.70307159423828, 55.303550720214844, 57.90403366088867, 60.5045166015625, 63.10499572753906, 65.70547485351562, 68.30596160888672, 70.90644073486328, 73.50691986083984, 76.10740661621094, 78.7078857421875, 81.30836486816406, 83.90885162353516, 86.50933074951172, 89.10980987548828, 91.71028900146484, 94.31077575683594, 96.9112548828125, 99.51173400878906]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 8.0, 9.0, 14.0, 20.0, 32.0, 52.0, 104.0, 137.0, 257.0, 432.0, 797.0, 1439.0, 2847.0, 5296.0, 10457.0, 20563.0, 42282.0, 85533.0, 164565.0, 296450.0, 492685.0, 2642651.0, 1543378.0, 434078.0, 260250.0, 142409.0, 72752.0, 35519.0, 17572.0, 8801.0, 4545.0, 2382.0, 1298.0, 753.0, 389.0, 222.0, 154.0, 92.0, 56.0, 41.0, 23.0, 24.0, 13.0, 18.0, 12.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.515625, -5.32464599609375, -5.1336669921875, -4.94268798828125, -4.751708984375, -4.56072998046875, -4.3697509765625, -4.17877197265625, -3.98779296875, -3.79681396484375, -3.6058349609375, -3.41485595703125, -3.223876953125, -3.03289794921875, -2.8419189453125, -2.65093994140625, -2.4599609375, -2.26898193359375, -2.0780029296875, -1.88702392578125, -1.696044921875, -1.50506591796875, -1.3140869140625, -1.12310791015625, -0.93212890625, -0.74114990234375, -0.5501708984375, -0.35919189453125, -0.168212890625, 0.02276611328125, 0.2137451171875, 0.40472412109375, 0.595703125, 0.78668212890625, 0.9776611328125, 1.16864013671875, 1.359619140625, 1.55059814453125, 1.7415771484375, 1.93255615234375, 2.12353515625, 2.31451416015625, 2.5054931640625, 2.69647216796875, 2.887451171875, 3.07843017578125, 3.2694091796875, 3.46038818359375, 3.6513671875, 3.84234619140625, 4.0333251953125, 4.22430419921875, 4.415283203125, 4.60626220703125, 4.7972412109375, 4.98822021484375, 5.17919921875, 5.37017822265625, 5.5611572265625, 5.75213623046875, 5.943115234375, 6.13409423828125, 6.3250732421875, 6.51605224609375, 6.70703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 18.0, 14.0, 18.0, 19.0, 16.0, 26.0, 24.0, 29.0, 28.0, 35.0, 36.0, 41.0, 43.0, 39.0, 66.0, 180.0, 700.0, 224.0, 61.0, 35.0, 40.0, 47.0, 36.0, 26.0, 35.0, 20.0, 21.0, 22.0, 15.0, 10.0, 13.0, 21.0, 9.0, 5.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.984375, -30.9375, -29.890625, -28.84375, -27.796875, -26.75, -25.703125, -24.65625, -23.609375, -22.5625, -21.515625, -20.46875, -19.421875, -18.375, -17.328125, -16.28125, -15.234375, -14.1875, -13.140625, -12.09375, -11.046875, -10.0, -8.953125, -7.90625, -6.859375, -5.8125, -4.765625, -3.71875, -2.671875, -1.625, -0.578125, 0.46875, 1.515625, 2.5625, 3.609375, 4.65625, 5.703125, 6.75, 7.796875, 8.84375, 9.890625, 10.9375, 11.984375, 13.03125, 14.078125, 15.125, 16.171875, 17.21875, 18.265625, 19.3125, 20.359375, 21.40625, 22.453125, 23.5, 24.546875, 25.59375, 26.640625, 27.6875, 28.734375, 29.78125, 30.828125, 31.875, 32.921875, 33.96875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 12.0, 20.0, 47.0, 61.0, 150.0, 198.0, 346.0, 641.0, 1042.0, 1665.0, 2894.0, 4665.0, 7971.0, 13318.0, 21293.0, 33976.0, 53548.0, 79893.0, 118400.0, 164815.0, 217136.0, 269822.0, 414418.0, 2275983.0, 1380301.0, 329739.0, 253589.0, 199613.0, 149268.0, 104917.0, 70572.0, 46087.0, 29114.0, 17907.0, 11106.0, 6684.0, 4093.0, 2445.0, 1466.0, 908.0, 491.0, 344.0, 198.0, 120.0, 55.0, 44.0, 16.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.5625, -2.47662353515625, -2.3907470703125, -2.30487060546875, -2.218994140625, -2.13311767578125, -2.0472412109375, -1.96136474609375, -1.87548828125, -1.78961181640625, -1.7037353515625, -1.61785888671875, -1.531982421875, -1.44610595703125, -1.3602294921875, -1.27435302734375, -1.1884765625, -1.10260009765625, -1.0167236328125, -0.93084716796875, -0.844970703125, -0.75909423828125, -0.6732177734375, -0.58734130859375, -0.50146484375, -0.41558837890625, -0.3297119140625, -0.24383544921875, -0.157958984375, -0.07208251953125, 0.0137939453125, 0.09967041015625, 0.185546875, 0.27142333984375, 0.3572998046875, 0.44317626953125, 0.529052734375, 0.61492919921875, 0.7008056640625, 0.78668212890625, 0.87255859375, 0.95843505859375, 1.0443115234375, 1.13018798828125, 1.216064453125, 1.30194091796875, 1.3878173828125, 1.47369384765625, 1.5595703125, 1.64544677734375, 1.7313232421875, 1.81719970703125, 1.903076171875, 1.98895263671875, 2.0748291015625, 2.16070556640625, 2.24658203125, 2.33245849609375, 2.4183349609375, 2.50421142578125, 2.590087890625, 2.67596435546875, 2.7618408203125, 2.84771728515625, 2.93359375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 10.0, 11.0, 13.0, 11.0, 13.0, 11.0, 21.0, 23.0, 13.0, 15.0, 24.0, 16.0, 26.0, 22.0, 31.0, 37.0, 32.0, 35.0, 41.0, 53.0, 285.0, 661.0, 162.0, 44.0, 27.0, 34.0, 33.0, 35.0, 32.0, 35.0, 23.0, 23.0, 33.0, 22.0, 15.0, 22.0, 19.0, 10.0, 9.0, 9.0, 6.0, 8.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-21.265625, -20.589599609375, -19.91357421875, -19.237548828125, -18.5615234375, -17.885498046875, -17.20947265625, -16.533447265625, -15.857421875, -15.181396484375, -14.50537109375, -13.829345703125, -13.1533203125, -12.477294921875, -11.80126953125, -11.125244140625, -10.44921875, -9.773193359375, -9.09716796875, -8.421142578125, -7.7451171875, -7.069091796875, -6.39306640625, -5.717041015625, -5.041015625, -4.364990234375, -3.68896484375, -3.012939453125, -2.3369140625, -1.660888671875, -0.98486328125, -0.308837890625, 0.3671875, 1.043212890625, 1.71923828125, 2.395263671875, 3.0712890625, 3.747314453125, 4.42333984375, 5.099365234375, 5.775390625, 6.451416015625, 7.12744140625, 7.803466796875, 8.4794921875, 9.155517578125, 9.83154296875, 10.507568359375, 11.18359375, 11.859619140625, 12.53564453125, 13.211669921875, 13.8876953125, 14.563720703125, 15.23974609375, 15.915771484375, 16.591796875, 17.267822265625, 17.94384765625, 18.619873046875, 19.2958984375, 19.971923828125, 20.64794921875, 21.323974609375, 22.0]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 14.0, 26.0, 33.0, 46.0, 67.0, 91.0, 129.0, 211.0, 335.0, 474.0, 749.0, 1274.0, 2379.0, 4708.0, 10972.0, 31234.0, 92321.0, 264714.0, 625188.0, 3997940.0, 751723.0, 325497.0, 116300.0, 39337.0, 13829.0, 5552.0, 2623.0, 1396.0, 774.0, 490.0, 324.0, 200.0, 140.0, 84.0, 56.0, 60.0, 32.0, 32.0, 22.0, 22.0, 8.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.122314453125, -6.89697265625, -6.671630859375, -6.4462890625, -6.220947265625, -5.99560546875, -5.770263671875, -5.544921875, -5.319580078125, -5.09423828125, -4.868896484375, -4.6435546875, -4.418212890625, -4.19287109375, -3.967529296875, -3.7421875, -3.516845703125, -3.29150390625, -3.066162109375, -2.8408203125, -2.615478515625, -2.39013671875, -2.164794921875, -1.939453125, -1.714111328125, -1.48876953125, -1.263427734375, -1.0380859375, -0.812744140625, -0.58740234375, -0.362060546875, -0.13671875, 0.088623046875, 0.31396484375, 0.539306640625, 0.7646484375, 0.989990234375, 1.21533203125, 1.440673828125, 1.666015625, 1.891357421875, 2.11669921875, 2.342041015625, 2.5673828125, 2.792724609375, 3.01806640625, 3.243408203125, 3.46875, 3.694091796875, 3.91943359375, 4.144775390625, 4.3701171875, 4.595458984375, 4.82080078125, 5.046142578125, 5.271484375, 5.496826171875, 5.72216796875, 5.947509765625, 6.1728515625, 6.398193359375, 6.62353515625, 6.848876953125, 7.07421875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 15.0, 12.0, 17.0, 12.0, 15.0, 24.0, 23.0, 38.0, 30.0, 43.0, 44.0, 38.0, 38.0, 43.0, 89.0, 603.0, 459.0, 64.0, 40.0, 43.0, 39.0, 40.0, 31.0, 31.0, 30.0, 32.0, 27.0, 19.0, 16.0, 10.0, 3.0, 11.0, 7.0, 8.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.500732421875, -22.68896484375, -21.877197265625, -21.0654296875, -20.253662109375, -19.44189453125, -18.630126953125, -17.818359375, -17.006591796875, -16.19482421875, -15.383056640625, -14.5712890625, -13.759521484375, -12.94775390625, -12.135986328125, -11.32421875, -10.512451171875, -9.70068359375, -8.888916015625, -8.0771484375, -7.265380859375, -6.45361328125, -5.641845703125, -4.830078125, -4.018310546875, -3.20654296875, -2.394775390625, -1.5830078125, -0.771240234375, 0.04052734375, 0.852294921875, 1.6640625, 2.475830078125, 3.28759765625, 4.099365234375, 4.9111328125, 5.722900390625, 6.53466796875, 7.346435546875, 8.158203125, 8.969970703125, 9.78173828125, 10.593505859375, 11.4052734375, 12.217041015625, 13.02880859375, 13.840576171875, 14.65234375, 15.464111328125, 16.27587890625, 17.087646484375, 17.8994140625, 18.711181640625, 19.52294921875, 20.334716796875, 21.146484375, 21.958251953125, 22.77001953125, 23.581787109375, 24.3935546875, 25.205322265625, 26.01708984375, 26.828857421875, 27.640625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 20.0, 53.0, 229.0, 444.0, 188.0, 39.0, 19.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37144470214844, -80.42475891113281, -74.47806549072266, -68.53137969970703, -62.58469009399414, -56.63800048828125, -50.691314697265625, -44.744625091552734, -38.797935485839844, -32.85124588012695, -26.904558181762695, -20.957870483398438, -15.011180877685547, -9.064491271972656, -3.1178054809570312, 2.8288841247558594, 8.77557373046875, 14.722262382507324, 20.6689510345459, 26.615638732910156, 32.56232833862305, 38.50901794433594, 44.45570373535156, 50.40239334106445, 56.349082946777344, 62.295772552490234, 68.24246215820312, 74.18914794921875, 80.13583374023438, 86.08252716064453, 92.02921295166016, 97.97590637207031, 103.92257690429688, 109.8692626953125, 115.81595611572266, 121.76264190673828, 127.70933532714844, 133.65602111816406, 139.6027069091797, 145.5493927001953, 151.49609375, 157.44277954101562, 163.38946533203125, 169.33615112304688, 175.28285217285156, 181.2295379638672, 187.1762237548828, 193.12290954589844, 199.06959533691406, 205.0162811279297, 210.9629669189453, 216.90966796875, 222.85635375976562, 228.80303955078125, 234.74972534179688, 240.6964111328125, 246.64309692382812, 252.58978271484375, 258.5364685058594, 264.483154296875, 270.4298400878906, 276.37652587890625, 282.3232421875, 288.2699279785156, 294.21661376953125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 2.0, 2.0, 9.0, 18.0, 14.0, 16.0, 19.0, 29.0, 38.0, 23.0, 42.0, 52.0, 39.0, 46.0, 61.0, 46.0, 42.0, 49.0, 47.0, 60.0, 47.0, 49.0, 31.0, 36.0, 38.0, 26.0, 16.0, 20.0, 14.0, 10.0, 11.0, 14.0, 11.0, 1.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.63560485839844, -55.57374572753906, -53.51188278198242, -51.45002365112305, -49.388160705566406, -47.32630157470703, -45.264442443847656, -43.202579498291016, -41.140716552734375, -39.078857421875, -37.01699447631836, -34.955135345458984, -32.893272399902344, -30.83141326904297, -28.76955223083496, -26.707691192626953, -24.645832061767578, -22.58397102355957, -20.522109985351562, -18.460250854492188, -16.398387908935547, -14.336527824401855, -12.274667739868164, -10.212806701660156, -8.150945663452148, -6.089084625244141, -4.027224063873291, -1.9653635025024414, 0.0964975357055664, 2.158358573913574, 4.220218658447266, 6.282079696655273, 8.343940734863281, 10.405801773071289, 12.467662811279297, 14.529522895812988, 16.591384887695312, 18.653244018554688, 20.715105056762695, 22.776966094970703, 24.83882713317871, 26.90068817138672, 28.962549209594727, 31.024410247802734, 33.08626937866211, 35.14813232421875, 37.209991455078125, 39.2718505859375, 41.33371353149414, 43.395572662353516, 45.457435607910156, 47.51929473876953, 49.58115768432617, 51.64301681518555, 53.70487976074219, 55.76673889160156, 57.82859802246094, 59.89045715332031, 61.95232009887695, 64.0141830444336, 66.07604217529297, 68.13790130615234, 70.19976043701172, 72.26162719726562, 74.323486328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 10.0, 5.0, 8.0, 11.0, 14.0, 8.0, 12.0, 16.0, 29.0, 42.0, 72.0, 109.0, 230.0, 324.0, 675.0, 1278.0, 2893.0, 7063.0, 22535.0, 183054.0, 2766829.0, 1122707.0, 62930.0, 14170.0, 5101.0, 2049.0, 984.0, 435.0, 228.0, 147.0, 90.0, 46.0, 48.0, 32.0, 29.0, 14.0, 17.0, 5.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.2978515625, -1.258270263671875, -1.21868896484375, -1.179107666015625, -1.1395263671875, -1.099945068359375, -1.06036376953125, -1.020782470703125, -0.981201171875, -0.941619873046875, -0.90203857421875, -0.862457275390625, -0.8228759765625, -0.783294677734375, -0.74371337890625, -0.704132080078125, -0.66455078125, -0.624969482421875, -0.58538818359375, -0.545806884765625, -0.5062255859375, -0.466644287109375, -0.42706298828125, -0.387481689453125, -0.347900390625, -0.308319091796875, -0.26873779296875, -0.229156494140625, -0.1895751953125, -0.149993896484375, -0.11041259765625, -0.070831298828125, -0.03125, 0.008331298828125, 0.04791259765625, 0.087493896484375, 0.1270751953125, 0.166656494140625, 0.20623779296875, 0.245819091796875, 0.285400390625, 0.324981689453125, 0.36456298828125, 0.404144287109375, 0.4437255859375, 0.483306884765625, 0.52288818359375, 0.562469482421875, 0.60205078125, 0.641632080078125, 0.68121337890625, 0.720794677734375, 0.7603759765625, 0.799957275390625, 0.83953857421875, 0.879119873046875, 0.918701171875, 0.958282470703125, 0.99786376953125, 1.037445068359375, 1.0770263671875, 1.116607666015625, 1.15618896484375, 1.195770263671875, 1.2353515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 6.0, 6.0, 3.0, 17.0, 11.0, 17.0, 18.0, 26.0, 43.0, 21.0, 42.0, 55.0, 54.0, 62.0, 56.0, 72.0, 62.0, 73.0, 63.0, 45.0, 50.0, 26.0, 31.0, 30.0, 18.0, 19.0, 16.0, 14.0, 15.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5324020385742188, -0.5145111083984375, -0.49662017822265625, -0.478729248046875, -0.46083831787109375, -0.4429473876953125, -0.42505645751953125, -0.40716552734375, -0.38927459716796875, -0.3713836669921875, -0.35349273681640625, -0.335601806640625, -0.31771087646484375, -0.2998199462890625, -0.28192901611328125, -0.2640380859375, -0.24614715576171875, -0.2282562255859375, -0.21036529541015625, -0.192474365234375, -0.17458343505859375, -0.1566925048828125, -0.13880157470703125, -0.12091064453125, -0.10301971435546875, -0.0851287841796875, -0.06723785400390625, -0.049346923828125, -0.03145599365234375, -0.0135650634765625, 0.00432586669921875, 0.022216796875, 0.04010772705078125, 0.0579986572265625, 0.07588958740234375, 0.093780517578125, 0.11167144775390625, 0.1295623779296875, 0.14745330810546875, 0.16534423828125, 0.18323516845703125, 0.2011260986328125, 0.21901702880859375, 0.236907958984375, 0.25479888916015625, 0.2726898193359375, 0.29058074951171875, 0.3084716796875, 0.32636260986328125, 0.3442535400390625, 0.36214447021484375, 0.380035400390625, 0.39792633056640625, 0.4158172607421875, 0.43370819091796875, 0.45159912109375, 0.46949005126953125, 0.4873809814453125, 0.5052719116210938, 0.523162841796875, 0.5410537719726562, 0.5589447021484375, 0.5768356323242188, 0.5947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 9.0, 13.0, 25.0, 36.0, 46.0, 92.0, 159.0, 379.0, 1145.0, 7766.0, 244910.0, 3870322.0, 64126.0, 3912.0, 797.0, 269.0, 115.0, 49.0, 35.0, 13.0, 14.0, 5.0, 13.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.259765625, -2.2008514404296875, -2.141937255859375, -2.0830230712890625, -2.02410888671875, -1.9651947021484375, -1.906280517578125, -1.8473663330078125, -1.7884521484375, -1.7295379638671875, -1.670623779296875, -1.6117095947265625, -1.55279541015625, -1.4938812255859375, -1.434967041015625, -1.3760528564453125, -1.317138671875, -1.2582244873046875, -1.199310302734375, -1.1403961181640625, -1.08148193359375, -1.0225677490234375, -0.963653564453125, -0.9047393798828125, -0.8458251953125, -0.7869110107421875, -0.727996826171875, -0.6690826416015625, -0.61016845703125, -0.5512542724609375, -0.492340087890625, -0.4334259033203125, -0.37451171875, -0.3155975341796875, -0.256683349609375, -0.1977691650390625, -0.13885498046875, -0.0799407958984375, -0.021026611328125, 0.0378875732421875, 0.0968017578125, 0.1557159423828125, 0.214630126953125, 0.2735443115234375, 0.33245849609375, 0.3913726806640625, 0.450286865234375, 0.5092010498046875, 0.568115234375, 0.6270294189453125, 0.685943603515625, 0.7448577880859375, 0.80377197265625, 0.8626861572265625, 0.921600341796875, 0.9805145263671875, 1.0394287109375, 1.0983428955078125, 1.157257080078125, 1.2161712646484375, 1.27508544921875, 1.3339996337890625, 1.392913818359375, 1.4518280029296875, 1.5107421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 10.0, 28.0, 28.0, 63.0, 140.0, 218.0, 502.0, 909.0, 933.0, 592.0, 285.0, 152.0, 80.0, 54.0, 18.0, 20.0, 10.0, 10.0, 8.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0263671875, -0.997039794921875, -0.96771240234375, -0.938385009765625, -0.9090576171875, -0.879730224609375, -0.85040283203125, -0.821075439453125, -0.791748046875, -0.762420654296875, -0.73309326171875, -0.703765869140625, -0.6744384765625, -0.645111083984375, -0.61578369140625, -0.586456298828125, -0.55712890625, -0.527801513671875, -0.49847412109375, -0.469146728515625, -0.4398193359375, -0.410491943359375, -0.38116455078125, -0.351837158203125, -0.322509765625, -0.293182373046875, -0.26385498046875, -0.234527587890625, -0.2052001953125, -0.175872802734375, -0.14654541015625, -0.117218017578125, -0.087890625, -0.058563232421875, -0.02923583984375, 9.1552734375e-05, 0.0294189453125, 0.058746337890625, 0.08807373046875, 0.117401123046875, 0.146728515625, 0.176055908203125, 0.20538330078125, 0.234710693359375, 0.2640380859375, 0.293365478515625, 0.32269287109375, 0.352020263671875, 0.38134765625, 0.410675048828125, 0.44000244140625, 0.469329833984375, 0.4986572265625, 0.527984619140625, 0.55731201171875, 0.586639404296875, 0.615966796875, 0.645294189453125, 0.67462158203125, 0.703948974609375, 0.7332763671875, 0.762603759765625, 0.79193115234375, 0.821258544921875, 0.8505859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 12.0, 82.0, 841.0, 80.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.266066312789917, -2.5464601516723633, -1.8268537521362305, -1.1072475910186768, -0.38764119148254395, 0.33196520805358887, 1.0515711307525635, 1.7711775302886963, 2.490783929824829, 3.210390090942383, 3.9299964904785156, 4.649602890014648, 5.369209289550781, 6.088815689086914, 6.8084211349487305, 7.528027534484863, 8.247633934020996, 8.967240333557129, 9.686846733093262, 10.406452178955078, 11.126058578491211, 11.845664978027344, 12.565271377563477, 13.28487777709961, 14.004484176635742, 14.724090576171875, 15.443696975708008, 16.16330337524414, 16.882909774780273, 17.602516174316406, 18.322120666503906, 19.041728973388672, 19.761333465576172, 20.480939865112305, 21.200546264648438, 21.92015266418457, 22.639759063720703, 23.359365463256836, 24.07897186279297, 24.79857635498047, 25.518184661865234, 26.237791061401367, 26.9573974609375, 27.677003860473633, 28.396610260009766, 29.1162166595459, 29.83582305908203, 30.55542755126953, 31.275033950805664, 31.994640350341797, 32.7142448425293, 33.43385314941406, 34.15345764160156, 34.87306594848633, 35.59267044067383, 36.312278747558594, 37.031883239746094, 37.751487731933594, 38.47109603881836, 39.19070053100586, 39.910308837890625, 40.629913330078125, 41.34952163696289, 42.06912612915039, 42.788734436035156]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 7.0, 4.0, 15.0, 16.0, 12.0, 27.0, 24.0, 26.0, 18.0, 21.0, 44.0, 43.0, 45.0, 55.0, 49.0, 51.0, 45.0, 66.0, 45.0, 47.0, 50.0, 37.0, 43.0, 32.0, 27.0, 28.0, 25.0, 24.0, 14.0, 10.0, 10.0, 10.0, 4.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3538265228271484, -2.278740406036377, -2.2036545276641846, -2.128568649291992, -2.0534825325012207, -1.9783965349197388, -1.9033105373382568, -1.828224539756775, -1.753138542175293, -1.678052544593811, -1.602966547012329, -1.5278805494308472, -1.4527945518493652, -1.3777085542678833, -1.3026225566864014, -1.2275365591049194, -1.1524505615234375, -1.0773645639419556, -1.0022785663604736, -0.9271925687789917, -0.8521065711975098, -0.7770205736160278, -0.7019345760345459, -0.626848578453064, -0.551762580871582, -0.4766765832901001, -0.40159058570861816, -0.32650458812713623, -0.2514185905456543, -0.17633259296417236, -0.10124659538269043, -0.026160597801208496, 0.04892563819885254, 0.12401163578033447, 0.1990976333618164, 0.27418363094329834, 0.3492696285247803, 0.4243556261062622, 0.49944162368774414, 0.5745276212692261, 0.649613618850708, 0.7246996164321899, 0.7997856140136719, 0.8748716115951538, 0.9499576091766357, 1.0250436067581177, 1.1001296043395996, 1.1752156019210815, 1.2503015995025635, 1.3253875970840454, 1.4004735946655273, 1.4755595922470093, 1.5506455898284912, 1.6257315874099731, 1.700817584991455, 1.775903582572937, 1.850989580154419, 1.9260755777359009, 2.001161575317383, 2.0762476921081543, 2.1513335704803467, 2.226419448852539, 2.3015055656433105, 2.376591682434082, 2.4516775608062744]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 13.0, 11.0, 21.0, 16.0, 30.0, 62.0, 82.0, 100.0, 135.0, 206.0, 292.0, 441.0, 709.0, 1094.0, 2171.0, 4099.0, 9931.0, 41239.0, 441964.0, 481303.0, 44344.0, 10372.0, 4281.0, 2227.0, 1250.0, 765.0, 449.0, 318.0, 182.0, 124.0, 78.0, 65.0, 38.0, 35.0, 27.0, 15.0, 15.0, 10.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.5009765625, -1.4555206298828125, -1.410064697265625, -1.3646087646484375, -1.31915283203125, -1.2736968994140625, -1.228240966796875, -1.1827850341796875, -1.1373291015625, -1.0918731689453125, -1.046417236328125, -1.0009613037109375, -0.95550537109375, -0.9100494384765625, -0.864593505859375, -0.8191375732421875, -0.773681640625, -0.7282257080078125, -0.682769775390625, -0.6373138427734375, -0.59185791015625, -0.5464019775390625, -0.500946044921875, -0.4554901123046875, -0.4100341796875, -0.3645782470703125, -0.319122314453125, -0.2736663818359375, -0.22821044921875, -0.1827545166015625, -0.137298583984375, -0.0918426513671875, -0.04638671875, -0.0009307861328125, 0.044525146484375, 0.0899810791015625, 0.13543701171875, 0.1808929443359375, 0.226348876953125, 0.2718048095703125, 0.3172607421875, 0.3627166748046875, 0.408172607421875, 0.4536285400390625, 0.49908447265625, 0.5445404052734375, 0.589996337890625, 0.6354522705078125, 0.680908203125, 0.7263641357421875, 0.771820068359375, 0.8172760009765625, 0.86273193359375, 0.9081878662109375, 0.953643798828125, 0.9990997314453125, 1.0445556640625, 1.0900115966796875, 1.135467529296875, 1.1809234619140625, 1.22637939453125, 1.2718353271484375, 1.317291259765625, 1.3627471923828125, 1.408203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 15.0, 9.0, 12.0, 9.0, 23.0, 26.0, 33.0, 24.0, 42.0, 51.0, 70.0, 69.0, 65.0, 54.0, 65.0, 67.0, 64.0, 49.0, 45.0, 34.0, 27.0, 31.0, 26.0, 19.0, 17.0, 13.0, 10.0, 5.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.59027099609375, -0.5716552734375, -0.55303955078125, -0.534423828125, -0.51580810546875, -0.4971923828125, -0.47857666015625, -0.4599609375, -0.44134521484375, -0.4227294921875, -0.40411376953125, -0.385498046875, -0.36688232421875, -0.3482666015625, -0.32965087890625, -0.31103515625, -0.29241943359375, -0.2738037109375, -0.25518798828125, -0.236572265625, -0.21795654296875, -0.1993408203125, -0.18072509765625, -0.162109375, -0.14349365234375, -0.1248779296875, -0.10626220703125, -0.087646484375, -0.06903076171875, -0.0504150390625, -0.03179931640625, -0.01318359375, 0.00543212890625, 0.0240478515625, 0.04266357421875, 0.061279296875, 0.07989501953125, 0.0985107421875, 0.11712646484375, 0.1357421875, 0.15435791015625, 0.1729736328125, 0.19158935546875, 0.210205078125, 0.22882080078125, 0.2474365234375, 0.26605224609375, 0.28466796875, 0.30328369140625, 0.3218994140625, 0.34051513671875, 0.359130859375, 0.37774658203125, 0.3963623046875, 0.41497802734375, 0.43359375, 0.45220947265625, 0.4708251953125, 0.48944091796875, 0.508056640625, 0.52667236328125, 0.5452880859375, 0.56390380859375, 0.58251953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 4.0, 12.0, 10.0, 8.0, 8.0, 11.0, 16.0, 16.0, 21.0, 23.0, 36.0, 30.0, 39.0, 62.0, 93.0, 254.0, 991.0, 7010.0, 63030.0, 408635.0, 472696.0, 84194.0, 9393.0, 1223.0, 286.0, 101.0, 70.0, 42.0, 30.0, 26.0, 24.0, 30.0, 18.0, 22.0, 10.0, 8.0, 9.0, 9.0, 2.0, 12.0, 6.0, 3.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0263671875, -0.9962387084960938, -0.9661102294921875, -0.9359817504882812, -0.905853271484375, -0.8757247924804688, -0.8455963134765625, -0.8154678344726562, -0.78533935546875, -0.7552108764648438, -0.7250823974609375, -0.6949539184570312, -0.664825439453125, -0.6346969604492188, -0.6045684814453125, -0.5744400024414062, -0.5443115234375, -0.5141830444335938, -0.4840545654296875, -0.45392608642578125, -0.423797607421875, -0.39366912841796875, -0.3635406494140625, -0.33341217041015625, -0.30328369140625, -0.27315521240234375, -0.2430267333984375, -0.21289825439453125, -0.182769775390625, -0.15264129638671875, -0.1225128173828125, -0.09238433837890625, -0.062255859375, -0.03212738037109375, -0.0019989013671875, 0.02812957763671875, 0.058258056640625, 0.08838653564453125, 0.1185150146484375, 0.14864349365234375, 0.17877197265625, 0.20890045166015625, 0.2390289306640625, 0.26915740966796875, 0.299285888671875, 0.32941436767578125, 0.3595428466796875, 0.38967132568359375, 0.4197998046875, 0.44992828369140625, 0.4800567626953125, 0.5101852416992188, 0.540313720703125, 0.5704421997070312, 0.6005706787109375, 0.6306991577148438, 0.66082763671875, 0.6909561157226562, 0.7210845947265625, 0.7512130737304688, 0.781341552734375, 0.8114700317382812, 0.8415985107421875, 0.8717269897460938, 0.90185546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 6.0, 14.0, 14.0, 17.0, 22.0, 13.0, 18.0, 25.0, 16.0, 25.0, 25.0, 18.0, 34.0, 36.0, 35.0, 29.0, 29.0, 43.0, 35.0, 35.0, 28.0, 31.0, 33.0, 37.0, 34.0, 32.0, 31.0, 27.0, 27.0, 40.0, 28.0, 17.0, 16.0, 16.0, 18.0, 7.0, 13.0, 13.0, 14.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.9501953125, -0.9215240478515625, -0.892852783203125, -0.8641815185546875, -0.83551025390625, -0.8068389892578125, -0.778167724609375, -0.7494964599609375, -0.7208251953125, -0.6921539306640625, -0.663482666015625, -0.6348114013671875, -0.60614013671875, -0.5774688720703125, -0.548797607421875, -0.5201263427734375, -0.491455078125, -0.4627838134765625, -0.434112548828125, -0.4054412841796875, -0.37677001953125, -0.3480987548828125, -0.319427490234375, -0.2907562255859375, -0.2620849609375, -0.2334136962890625, -0.204742431640625, -0.1760711669921875, -0.14739990234375, -0.1187286376953125, -0.090057373046875, -0.0613861083984375, -0.03271484375, -0.0040435791015625, 0.024627685546875, 0.0532989501953125, 0.08197021484375, 0.1106414794921875, 0.139312744140625, 0.1679840087890625, 0.1966552734375, 0.2253265380859375, 0.253997802734375, 0.2826690673828125, 0.31134033203125, 0.3400115966796875, 0.368682861328125, 0.3973541259765625, 0.426025390625, 0.4546966552734375, 0.483367919921875, 0.5120391845703125, 0.54071044921875, 0.5693817138671875, 0.598052978515625, 0.6267242431640625, 0.6553955078125, 0.6840667724609375, 0.712738037109375, 0.7414093017578125, 0.77008056640625, 0.7987518310546875, 0.827423095703125, 0.8560943603515625, 0.884765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 22.0, 22.0, 30.0, 39.0, 59.0, 92.0, 162.0, 272.0, 514.0, 982.0, 2161.0, 5677.0, 19603.0, 90168.0, 380780.0, 411639.0, 103047.0, 22505.0, 6197.0, 2243.0, 1019.0, 510.0, 282.0, 172.0, 110.0, 62.0, 47.0, 29.0, 24.0, 18.0, 4.0, 14.0, 9.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.25439453125, -0.24692153930664062, -0.23944854736328125, -0.23197555541992188, -0.2245025634765625, -0.21702957153320312, -0.20955657958984375, -0.20208358764648438, -0.194610595703125, -0.18713760375976562, -0.17966461181640625, -0.17219161987304688, -0.1647186279296875, -0.15724563598632812, -0.14977264404296875, -0.14229965209960938, -0.13482666015625, -0.12735366821289062, -0.11988067626953125, -0.11240768432617188, -0.1049346923828125, -0.09746170043945312, -0.08998870849609375, -0.08251571655273438, -0.075042724609375, -0.06756973266601562, -0.06009674072265625, -0.052623748779296875, -0.0451507568359375, -0.037677764892578125, -0.03020477294921875, -0.022731781005859375, -0.0152587890625, -0.007785797119140625, -0.00031280517578125, 0.007160186767578125, 0.0146331787109375, 0.022106170654296875, 0.02957916259765625, 0.037052154541015625, 0.044525146484375, 0.051998138427734375, 0.05947113037109375, 0.06694412231445312, 0.0744171142578125, 0.08189010620117188, 0.08936309814453125, 0.09683609008789062, 0.10430908203125, 0.11178207397460938, 0.11925506591796875, 0.12672805786132812, 0.1342010498046875, 0.14167404174804688, 0.14914703369140625, 0.15662002563476562, 0.164093017578125, 0.17156600952148438, 0.17903900146484375, 0.18651199340820312, 0.1939849853515625, 0.20145797729492188, 0.20893096923828125, 0.21640396118164062, 0.223876953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 11.0, 5.0, 22.0, 20.0, 38.0, 45.0, 52.0, 58.0, 87.0, 90.0, 95.0, 91.0, 73.0, 68.0, 53.0, 44.0, 28.0, 26.0, 21.0, 12.0, 10.0, 7.0, 2.0, 3.0, 6.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.008676528930664e-05, -1.941155642271042e-05, -1.8736347556114197e-05, -1.8061138689517975e-05, -1.7385929822921753e-05, -1.671072095632553e-05, -1.603551208972931e-05, -1.5360303223133087e-05, -1.4685094356536865e-05, -1.4009885489940643e-05, -1.3334676623344421e-05, -1.26594677567482e-05, -1.1984258890151978e-05, -1.1309050023555756e-05, -1.0633841156959534e-05, -9.958632290363312e-06, -9.28342342376709e-06, -8.608214557170868e-06, -7.933005690574646e-06, -7.257796823978424e-06, -6.582587957382202e-06, -5.90737909078598e-06, -5.232170224189758e-06, -4.556961357593536e-06, -3.8817524909973145e-06, -3.2065436244010925e-06, -2.5313347578048706e-06, -1.8561258912086487e-06, -1.1809170246124268e-06, -5.057081580162048e-07, 1.695007085800171e-07, 8.44709575176239e-07, 1.519918441772461e-06, 2.195127308368683e-06, 2.8703361749649048e-06, 3.5455450415611267e-06, 4.220753908157349e-06, 4.8959627747535706e-06, 5.5711716413497925e-06, 6.246380507946014e-06, 6.921589374542236e-06, 7.596798241138458e-06, 8.27200710773468e-06, 8.947215974330902e-06, 9.622424840927124e-06, 1.0297633707523346e-05, 1.0972842574119568e-05, 1.164805144071579e-05, 1.2323260307312012e-05, 1.2998469173908234e-05, 1.3673678040504456e-05, 1.4348886907100677e-05, 1.50240957736969e-05, 1.569930464029312e-05, 1.6374513506889343e-05, 1.7049722373485565e-05, 1.7724931240081787e-05, 1.840014010667801e-05, 1.907534897327423e-05, 1.9750557839870453e-05, 2.0425766706466675e-05, 2.1100975573062897e-05, 2.177618443965912e-05, 2.245139330625534e-05, 2.3126602172851562e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 6.0, 10.0, 14.0, 46.0, 110.0, 288.0, 675.0, 2221.0, 8798.0, 51933.0, 431966.0, 479041.0, 59942.0, 9861.0, 2446.0, 729.0, 251.0, 110.0, 47.0, 17.0, 18.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.23958587646484375, -0.2281951904296875, -0.21680450439453125, -0.205413818359375, -0.19402313232421875, -0.1826324462890625, -0.17124176025390625, -0.15985107421875, -0.14846038818359375, -0.1370697021484375, -0.12567901611328125, -0.114288330078125, -0.10289764404296875, -0.0915069580078125, -0.08011627197265625, -0.0687255859375, -0.05733489990234375, -0.0459442138671875, -0.03455352783203125, -0.023162841796875, -0.01177215576171875, -0.0003814697265625, 0.01100921630859375, 0.02239990234375, 0.03379058837890625, 0.0451812744140625, 0.05657196044921875, 0.067962646484375, 0.07935333251953125, 0.0907440185546875, 0.10213470458984375, 0.113525390625, 0.12491607666015625, 0.1363067626953125, 0.14769744873046875, 0.159088134765625, 0.17047882080078125, 0.1818695068359375, 0.19326019287109375, 0.20465087890625, 0.21604156494140625, 0.2274322509765625, 0.23882293701171875, 0.250213623046875, 0.26160430908203125, 0.2729949951171875, 0.28438568115234375, 0.2957763671875, 0.30716705322265625, 0.3185577392578125, 0.32994842529296875, 0.341339111328125, 0.35272979736328125, 0.3641204833984375, 0.37551116943359375, 0.38690185546875, 0.39829254150390625, 0.4096832275390625, 0.42107391357421875, 0.432464599609375, 0.44385528564453125, 0.4552459716796875, 0.46663665771484375, 0.47802734375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 6.0, 7.0, 10.0, 13.0, 10.0, 22.0, 31.0, 40.0, 64.0, 46.0, 76.0, 79.0, 72.0, 74.0, 74.0, 74.0, 61.0, 43.0, 49.0, 38.0, 28.0, 22.0, 14.0, 15.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2293701171875, -0.2222137451171875, -0.215057373046875, -0.2079010009765625, -0.20074462890625, -0.1935882568359375, -0.186431884765625, -0.1792755126953125, -0.172119140625, -0.1649627685546875, -0.157806396484375, -0.1506500244140625, -0.14349365234375, -0.1363372802734375, -0.129180908203125, -0.1220245361328125, -0.1148681640625, -0.1077117919921875, -0.100555419921875, -0.0933990478515625, -0.08624267578125, -0.0790863037109375, -0.071929931640625, -0.0647735595703125, -0.0576171875, -0.0504608154296875, -0.043304443359375, -0.0361480712890625, -0.02899169921875, -0.0218353271484375, -0.014678955078125, -0.0075225830078125, -0.0003662109375, 0.0067901611328125, 0.013946533203125, 0.0211029052734375, 0.02825927734375, 0.0354156494140625, 0.042572021484375, 0.0497283935546875, 0.056884765625, 0.0640411376953125, 0.071197509765625, 0.0783538818359375, 0.08551025390625, 0.0926666259765625, 0.099822998046875, 0.1069793701171875, 0.1141357421875, 0.1212921142578125, 0.128448486328125, 0.1356048583984375, 0.14276123046875, 0.1499176025390625, 0.157073974609375, 0.1642303466796875, 0.17138671875, 0.1785430908203125, 0.185699462890625, 0.1928558349609375, 0.20001220703125, 0.2071685791015625, 0.214324951171875, 0.2214813232421875, 0.2286376953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 19.0, 58.0, 212.0, 333.0, 251.0, 92.0, 33.0, 12.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.187150955200195, -16.878541946411133, -16.56993293762207, -16.261323928833008, -15.952713966369629, -15.644104957580566, -15.335495948791504, -15.026885986328125, -14.718276977539062, -14.40966796875, -14.101058959960938, -13.792448997497559, -13.483839988708496, -13.175230979919434, -12.866621971130371, -12.558012008666992, -12.24940299987793, -11.940793991088867, -11.632184982299805, -11.323575019836426, -11.014966011047363, -10.7063570022583, -10.397747993469238, -10.08913803100586, -9.780529975891113, -9.47192096710205, -9.163311958312988, -8.85470199584961, -8.546092987060547, -8.237483978271484, -7.928874969482422, -7.620265483856201, -7.311656475067139, -7.003047466278076, -6.6944379806518555, -6.385828971862793, -6.077219486236572, -5.76861047744751, -5.460000991821289, -5.151391983032227, -4.842782974243164, -4.534173965454102, -4.225564479827881, -3.9169554710388184, -3.6083459854125977, -3.299736976623535, -2.9911277294158936, -2.682518482208252, -2.3739089965820312, -2.0652997493743896, -1.756690502166748, -1.448081374168396, -1.1394721269607544, -0.8308628797531128, -0.5222537517547607, -0.21364450454711914, 0.09496474266052246, 0.4035739600658417, 0.7121831774711609, 1.0207923650741577, 1.3294016122817993, 1.638010859489441, 1.946619987487793, 2.2552292346954346, 2.563838481903076]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 8.0, 9.0, 8.0, 14.0, 12.0, 16.0, 18.0, 25.0, 24.0, 24.0, 33.0, 30.0, 46.0, 48.0, 57.0, 40.0, 60.0, 43.0, 49.0, 43.0, 50.0, 44.0, 39.0, 33.0, 41.0, 30.0, 22.0, 26.0, 11.0, 15.0, 12.0, 13.0, 14.0, 7.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.65399169921875, -5.475531101226807, -5.297070503234863, -5.11860990524292, -4.940149307250977, -4.761688232421875, -4.58322811126709, -4.404767036437988, -4.226306438446045, -4.047845840454102, -3.869385242462158, -3.690924644470215, -3.5124638080596924, -3.334003210067749, -3.1555426120758057, -2.977081775665283, -2.798621416091919, -2.6201608180999756, -2.4417002201080322, -2.2632393836975098, -2.0847787857055664, -1.906318187713623, -1.7278575897216797, -1.5493968725204468, -1.3709362745285034, -1.19247567653656, -1.0140149593353271, -0.8355543613433838, -0.6570937037467957, -0.4786330461502075, -0.30017244815826416, -0.12171173095703125, 0.05674886703491211, 0.23520950973033905, 0.413670152425766, 0.5921307802200317, 0.7705914378166199, 0.949052095413208, 1.1275126934051514, 1.3059734106063843, 1.4844340085983276, 1.662894606590271, 1.841355323791504, 2.0198159217834473, 2.1982765197753906, 2.376737117767334, 2.5551977157592773, 2.7336585521698, 2.912119150161743, 3.0905797481536865, 3.26904034614563, 3.4475011825561523, 3.6259617805480957, 3.804422378540039, 3.9828829765319824, 4.161343574523926, 4.339804172515869, 4.5182647705078125, 4.696725368499756, 4.875185966491699, 5.053646564483643, 5.232107162475586, 5.4105682373046875, 5.589028835296631, 5.767489433288574]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 2.0, 6.0, 8.0, 15.0, 9.0, 6.0, 9.0, 20.0, 21.0, 24.0, 18.0, 33.0, 45.0, 79.0, 96.0, 254.0, 640.0, 2363.0, 20859.0, 3136652.0, 1018685.0, 11618.0, 1716.0, 505.0, 211.0, 95.0, 74.0, 39.0, 38.0, 14.0, 16.0, 16.0, 19.0, 11.0, 8.0, 15.0, 8.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.683441162109375, -2.58367919921875, -2.483917236328125, -2.3841552734375, -2.284393310546875, -2.18463134765625, -2.084869384765625, -1.985107421875, -1.885345458984375, -1.78558349609375, -1.685821533203125, -1.5860595703125, -1.486297607421875, -1.38653564453125, -1.286773681640625, -1.18701171875, -1.087249755859375, -0.98748779296875, -0.887725830078125, -0.7879638671875, -0.688201904296875, -0.58843994140625, -0.488677978515625, -0.388916015625, -0.289154052734375, -0.18939208984375, -0.089630126953125, 0.0101318359375, 0.109893798828125, 0.20965576171875, 0.309417724609375, 0.4091796875, 0.508941650390625, 0.60870361328125, 0.708465576171875, 0.8082275390625, 0.907989501953125, 1.00775146484375, 1.107513427734375, 1.207275390625, 1.307037353515625, 1.40679931640625, 1.506561279296875, 1.6063232421875, 1.706085205078125, 1.80584716796875, 1.905609130859375, 2.00537109375, 2.105133056640625, 2.20489501953125, 2.304656982421875, 2.4044189453125, 2.504180908203125, 2.60394287109375, 2.703704833984375, 2.803466796875, 2.903228759765625, 3.00299072265625, 3.102752685546875, 3.2025146484375, 3.302276611328125, 3.40203857421875, 3.501800537109375, 3.6015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 6.0, 14.0, 14.0, 14.0, 6.0, 16.0, 26.0, 28.0, 30.0, 33.0, 34.0, 42.0, 46.0, 44.0, 59.0, 51.0, 46.0, 63.0, 49.0, 46.0, 45.0, 38.0, 42.0, 31.0, 22.0, 16.0, 25.0, 21.0, 20.0, 15.0, 6.0, 10.0, 7.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.470947265625, -0.45648193359375, -0.4420166015625, -0.42755126953125, -0.4130859375, -0.39862060546875, -0.3841552734375, -0.36968994140625, -0.355224609375, -0.34075927734375, -0.3262939453125, -0.31182861328125, -0.29736328125, -0.28289794921875, -0.2684326171875, -0.25396728515625, -0.239501953125, -0.22503662109375, -0.2105712890625, -0.19610595703125, -0.181640625, -0.16717529296875, -0.1527099609375, -0.13824462890625, -0.123779296875, -0.10931396484375, -0.0948486328125, -0.08038330078125, -0.06591796875, -0.05145263671875, -0.0369873046875, -0.02252197265625, -0.008056640625, 0.00640869140625, 0.0208740234375, 0.03533935546875, 0.0498046875, 0.06427001953125, 0.0787353515625, 0.09320068359375, 0.107666015625, 0.12213134765625, 0.1365966796875, 0.15106201171875, 0.16552734375, 0.17999267578125, 0.1944580078125, 0.20892333984375, 0.223388671875, 0.23785400390625, 0.2523193359375, 0.26678466796875, 0.28125, 0.29571533203125, 0.3101806640625, 0.32464599609375, 0.339111328125, 0.35357666015625, 0.3680419921875, 0.38250732421875, 0.39697265625, 0.41143798828125, 0.4259033203125, 0.44036865234375, 0.454833984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 9.0, 11.0, 24.0, 25.0, 36.0, 63.0, 111.0, 193.0, 417.0, 775.0, 1695.0, 3861.0, 10449.0, 31700.0, 111856.0, 445305.0, 1736504.0, 1382339.0, 341587.0, 86962.0, 25806.0, 8461.0, 3305.0, 1402.0, 609.0, 312.0, 171.0, 103.0, 64.0, 34.0, 27.0, 16.0, 15.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6772384643554688, -0.6489105224609375, -0.6205825805664062, -0.592254638671875, -0.5639266967773438, -0.5355987548828125, -0.5072708129882812, -0.47894287109375, -0.45061492919921875, -0.4222869873046875, -0.39395904541015625, -0.365631103515625, -0.33730316162109375, -0.3089752197265625, -0.28064727783203125, -0.2523193359375, -0.22399139404296875, -0.1956634521484375, -0.16733551025390625, -0.139007568359375, -0.11067962646484375, -0.0823516845703125, -0.05402374267578125, -0.02569580078125, 0.00263214111328125, 0.0309600830078125, 0.05928802490234375, 0.087615966796875, 0.11594390869140625, 0.1442718505859375, 0.17259979248046875, 0.200927734375, 0.22925567626953125, 0.2575836181640625, 0.28591156005859375, 0.314239501953125, 0.34256744384765625, 0.3708953857421875, 0.39922332763671875, 0.42755126953125, 0.45587921142578125, 0.4842071533203125, 0.5125350952148438, 0.540863037109375, 0.5691909790039062, 0.5975189208984375, 0.6258468627929688, 0.6541748046875, 0.6825027465820312, 0.7108306884765625, 0.7391586303710938, 0.767486572265625, 0.7958145141601562, 0.8241424560546875, 0.8524703979492188, 0.88079833984375, 0.9091262817382812, 0.9374542236328125, 0.9657821655273438, 0.994110107421875, 1.0224380493164062, 1.0507659912109375, 1.0790939331054688, 1.107421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 7.0, 13.0, 23.0, 42.0, 33.0, 38.0, 64.0, 78.0, 98.0, 153.0, 199.0, 250.0, 320.0, 398.0, 475.0, 424.0, 338.0, 234.0, 218.0, 159.0, 117.0, 95.0, 91.0, 33.0, 42.0, 31.0, 24.0, 13.0, 16.0, 8.0, 4.0, 3.0, 6.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3698921203613281, -0.35477447509765625, -0.3396568298339844, -0.3245391845703125, -0.3094215393066406, -0.29430389404296875, -0.2791862487792969, -0.264068603515625, -0.24895095825195312, -0.23383331298828125, -0.21871566772460938, -0.2035980224609375, -0.18848037719726562, -0.17336273193359375, -0.15824508666992188, -0.14312744140625, -0.12800979614257812, -0.11289215087890625, -0.09777450561523438, -0.0826568603515625, -0.06753921508789062, -0.05242156982421875, -0.037303924560546875, -0.022186279296875, -0.007068634033203125, 0.00804901123046875, 0.023166656494140625, 0.0382843017578125, 0.053401947021484375, 0.06851959228515625, 0.08363723754882812, 0.0987548828125, 0.11387252807617188, 0.12899017333984375, 0.14410781860351562, 0.1592254638671875, 0.17434310913085938, 0.18946075439453125, 0.20457839965820312, 0.219696044921875, 0.23481369018554688, 0.24993133544921875, 0.2650489807128906, 0.2801666259765625, 0.2952842712402344, 0.31040191650390625, 0.3255195617675781, 0.34063720703125, 0.3557548522949219, 0.37087249755859375, 0.3859901428222656, 0.4011077880859375, 0.4162254333496094, 0.43134307861328125, 0.4464607238769531, 0.461578369140625, 0.4766960144042969, 0.49181365966796875, 0.5069313049316406, 0.5220489501953125, 0.5371665954589844, 0.5522842407226562, 0.5674018859863281, 0.58251953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 11.0, 41.0, 197.0, 322.0, 301.0, 95.0, 31.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.273847579956055, -8.005331993103027, -7.736815929412842, -7.468299865722656, -7.199783802032471, -6.931267738342285, -6.662752151489258, -6.394236087799072, -6.125720024108887, -5.857203960418701, -5.588688373565674, -5.320172309875488, -5.051656246185303, -4.783140182495117, -4.51462459564209, -4.246108531951904, -3.977592945098877, -3.7090771198272705, -3.440561056137085, -3.1720452308654785, -2.903529167175293, -2.6350133419036865, -2.36649751663208, -2.0979814529418945, -1.829465627670288, -1.560949683189392, -1.292433738708496, -1.0239179134368896, -0.7554019689559937, -0.48688602447509766, -0.2183701992034912, 0.050145745277404785, 0.3186616897583008, 0.5871776342391968, 0.855693519115448, 1.1242094039916992, 1.3927253484725952, 1.6612412929534912, 1.9297571182250977, 2.198273181915283, 2.4667890071868896, 2.735304832458496, 3.0038208961486816, 3.272336721420288, 3.5408525466918945, 3.80936861038208, 4.077884674072266, 4.346400260925293, 4.6149163246154785, 4.883432388305664, 5.151947975158691, 5.420464038848877, 5.6889801025390625, 5.95749568939209, 6.226011753082275, 6.494527816772461, 6.763043403625488, 7.031559467315674, 7.300075054168701, 7.568591117858887, 7.837107181549072, 8.105623245239258, 8.374138832092285, 8.642654418945312, 8.911170959472656]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 14.0, 16.0, 17.0, 14.0, 31.0, 21.0, 33.0, 34.0, 36.0, 41.0, 42.0, 50.0, 37.0, 42.0, 37.0, 33.0, 52.0, 43.0, 30.0, 42.0, 41.0, 35.0, 38.0, 30.0, 31.0, 21.0, 24.0, 22.0, 10.0, 10.0, 8.0, 10.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5067453384399414, -1.4565467834472656, -1.4063481092453003, -1.3561495542526245, -1.3059508800506592, -1.2557523250579834, -1.2055537700653076, -1.1553552150726318, -1.1051565408706665, -1.0549579858779907, -1.0047593116760254, -0.9545607566833496, -0.904362142086029, -0.8541635274887085, -0.8039649724960327, -0.7537663578987122, -0.7035677433013916, -0.653369128704071, -0.6031705141067505, -0.5529719591140747, -0.5027733445167542, -0.4525747299194336, -0.4023761451244354, -0.35217756032943726, -0.3019789457321167, -0.25178033113479614, -0.20158174633979797, -0.1513831466436386, -0.10118454694747925, -0.05098593235015869, -0.0007873475551605225, 0.049411237239837646, 0.09960973262786865, 0.14980833232402802, 0.20000693202018738, 0.25020551681518555, 0.3004041314125061, 0.35060274600982666, 0.40080133080482483, 0.450999915599823, 0.5011985301971436, 0.5513971447944641, 0.6015957593917847, 0.6517943143844604, 0.701992928981781, 0.7521915435791016, 0.8023900985717773, 0.8525887131690979, 0.9027873277664185, 0.952985942363739, 1.0031845569610596, 1.0533831119537354, 1.1035816669464111, 1.1537803411483765, 1.2039788961410522, 1.2541775703430176, 1.3043761253356934, 1.3545746803283691, 1.4047733545303345, 1.4549719095230103, 1.5051705837249756, 1.5553691387176514, 1.6055676937103271, 1.655766248703003, 1.7059649229049683]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 6.0, 8.0, 9.0, 14.0, 11.0, 22.0, 26.0, 45.0, 53.0, 93.0, 113.0, 175.0, 337.0, 635.0, 1110.0, 2252.0, 4833.0, 11313.0, 27245.0, 68411.0, 166538.0, 305793.0, 256908.0, 119640.0, 47829.0, 19274.0, 8332.0, 3703.0, 1754.0, 843.0, 461.0, 262.0, 166.0, 91.0, 72.0, 46.0, 27.0, 32.0, 20.0, 14.0, 9.0, 12.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.85888671875, -0.8334808349609375, -0.808074951171875, -0.7826690673828125, -0.75726318359375, -0.7318572998046875, -0.706451416015625, -0.6810455322265625, -0.6556396484375, -0.6302337646484375, -0.604827880859375, -0.5794219970703125, -0.55401611328125, -0.5286102294921875, -0.503204345703125, -0.4777984619140625, -0.452392578125, -0.4269866943359375, -0.401580810546875, -0.3761749267578125, -0.35076904296875, -0.3253631591796875, -0.299957275390625, -0.2745513916015625, -0.2491455078125, -0.2237396240234375, -0.198333740234375, -0.1729278564453125, -0.14752197265625, -0.1221160888671875, -0.096710205078125, -0.0713043212890625, -0.0458984375, -0.0204925537109375, 0.004913330078125, 0.0303192138671875, 0.05572509765625, 0.0811309814453125, 0.106536865234375, 0.1319427490234375, 0.1573486328125, 0.1827545166015625, 0.208160400390625, 0.2335662841796875, 0.25897216796875, 0.2843780517578125, 0.309783935546875, 0.3351898193359375, 0.360595703125, 0.3860015869140625, 0.411407470703125, 0.4368133544921875, 0.46221923828125, 0.4876251220703125, 0.513031005859375, 0.5384368896484375, 0.5638427734375, 0.5892486572265625, 0.614654541015625, 0.6400604248046875, 0.66546630859375, 0.6908721923828125, 0.716278076171875, 0.7416839599609375, 0.76708984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 11.0, 7.0, 10.0, 22.0, 11.0, 19.0, 22.0, 26.0, 26.0, 37.0, 36.0, 44.0, 60.0, 47.0, 56.0, 59.0, 58.0, 51.0, 64.0, 43.0, 57.0, 33.0, 25.0, 29.0, 26.0, 21.0, 23.0, 12.0, 12.0, 10.0, 9.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.492431640625, -0.4770164489746094, -0.46160125732421875, -0.4461860656738281, -0.4307708740234375, -0.4153556823730469, -0.39994049072265625, -0.3845252990722656, -0.369110107421875, -0.3536949157714844, -0.33827972412109375, -0.3228645324707031, -0.3074493408203125, -0.2920341491699219, -0.27661895751953125, -0.2612037658691406, -0.24578857421875, -0.23037338256835938, -0.21495819091796875, -0.19954299926757812, -0.1841278076171875, -0.16871261596679688, -0.15329742431640625, -0.13788223266601562, -0.122467041015625, -0.10705184936523438, -0.09163665771484375, -0.07622146606445312, -0.0608062744140625, -0.045391082763671875, -0.02997589111328125, -0.014560699462890625, 0.0008544921875, 0.016269683837890625, 0.03168487548828125, 0.047100067138671875, 0.0625152587890625, 0.07793045043945312, 0.09334564208984375, 0.10876083374023438, 0.124176025390625, 0.13959121704101562, 0.15500640869140625, 0.17042160034179688, 0.1858367919921875, 0.20125198364257812, 0.21666717529296875, 0.23208236694335938, 0.24749755859375, 0.2629127502441406, 0.27832794189453125, 0.2937431335449219, 0.3091583251953125, 0.3245735168457031, 0.33998870849609375, 0.3554039001464844, 0.370819091796875, 0.3862342834472656, 0.40164947509765625, 0.4170646667480469, 0.4324798583984375, 0.4478950500488281, 0.46331024169921875, 0.4787254333496094, 0.494140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 18.0, 15.0, 27.0, 17.0, 23.0, 25.0, 32.0, 36.0, 51.0, 74.0, 128.0, 429.0, 3754.0, 138332.0, 835864.0, 66792.0, 2111.0, 307.0, 109.0, 69.0, 54.0, 32.0, 30.0, 27.0, 34.0, 30.0, 17.0, 15.0, 9.0, 11.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.78515625, -2.687103271484375, -2.58905029296875, -2.490997314453125, -2.3929443359375, -2.294891357421875, -2.19683837890625, -2.098785400390625, -2.000732421875, -1.902679443359375, -1.80462646484375, -1.706573486328125, -1.6085205078125, -1.510467529296875, -1.41241455078125, -1.314361572265625, -1.21630859375, -1.118255615234375, -1.02020263671875, -0.922149658203125, -0.8240966796875, -0.726043701171875, -0.62799072265625, -0.529937744140625, -0.431884765625, -0.333831787109375, -0.23577880859375, -0.137725830078125, -0.0396728515625, 0.058380126953125, 0.15643310546875, 0.254486083984375, 0.3525390625, 0.450592041015625, 0.54864501953125, 0.646697998046875, 0.7447509765625, 0.842803955078125, 0.94085693359375, 1.038909912109375, 1.136962890625, 1.235015869140625, 1.33306884765625, 1.431121826171875, 1.5291748046875, 1.627227783203125, 1.72528076171875, 1.823333740234375, 1.92138671875, 2.019439697265625, 2.11749267578125, 2.215545654296875, 2.3135986328125, 2.411651611328125, 2.50970458984375, 2.607757568359375, 2.705810546875, 2.803863525390625, 2.90191650390625, 2.999969482421875, 3.0980224609375, 3.196075439453125, 3.29412841796875, 3.392181396484375, 3.490234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 9.0, 4.0, 12.0, 13.0, 15.0, 16.0, 18.0, 24.0, 21.0, 15.0, 31.0, 23.0, 33.0, 35.0, 35.0, 32.0, 43.0, 30.0, 48.0, 27.0, 45.0, 31.0, 36.0, 35.0, 31.0, 52.0, 32.0, 41.0, 27.0, 21.0, 28.0, 28.0, 12.0, 15.0, 13.0, 6.0, 8.0, 13.0, 10.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.759765625, -0.7356643676757812, -0.7115631103515625, -0.6874618530273438, -0.663360595703125, -0.6392593383789062, -0.6151580810546875, -0.5910568237304688, -0.56695556640625, -0.5428543090820312, -0.5187530517578125, -0.49465179443359375, -0.470550537109375, -0.44644927978515625, -0.4223480224609375, -0.39824676513671875, -0.3741455078125, -0.35004425048828125, -0.3259429931640625, -0.30184173583984375, -0.277740478515625, -0.25363922119140625, -0.2295379638671875, -0.20543670654296875, -0.18133544921875, -0.15723419189453125, -0.1331329345703125, -0.10903167724609375, -0.084930419921875, -0.06082916259765625, -0.0367279052734375, -0.01262664794921875, 0.011474609375, 0.03557586669921875, 0.0596771240234375, 0.08377838134765625, 0.107879638671875, 0.13198089599609375, 0.1560821533203125, 0.18018341064453125, 0.20428466796875, 0.22838592529296875, 0.2524871826171875, 0.27658843994140625, 0.300689697265625, 0.32479095458984375, 0.3488922119140625, 0.37299346923828125, 0.3970947265625, 0.42119598388671875, 0.4452972412109375, 0.46939849853515625, 0.493499755859375, 0.5176010131835938, 0.5417022705078125, 0.5658035278320312, 0.58990478515625, 0.6140060424804688, 0.6381072998046875, 0.6622085571289062, 0.686309814453125, 0.7104110717773438, 0.7345123291015625, 0.7586135864257812, 0.78271484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 8.0, 11.0, 11.0, 24.0, 18.0, 48.0, 75.0, 134.0, 244.0, 415.0, 917.0, 1928.0, 4230.0, 10799.0, 30880.0, 109807.0, 363967.0, 365521.0, 109711.0, 30839.0, 10724.0, 4322.0, 1908.0, 921.0, 472.0, 243.0, 134.0, 73.0, 37.0, 41.0, 25.0, 18.0, 12.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.53955078125, -0.5232009887695312, -0.5068511962890625, -0.49050140380859375, -0.474151611328125, -0.45780181884765625, -0.4414520263671875, -0.42510223388671875, -0.40875244140625, -0.39240264892578125, -0.3760528564453125, -0.35970306396484375, -0.343353271484375, -0.32700347900390625, -0.3106536865234375, -0.29430389404296875, -0.2779541015625, -0.26160430908203125, -0.2452545166015625, -0.22890472412109375, -0.212554931640625, -0.19620513916015625, -0.1798553466796875, -0.16350555419921875, -0.14715576171875, -0.13080596923828125, -0.1144561767578125, -0.09810638427734375, -0.081756591796875, -0.06540679931640625, -0.0490570068359375, -0.03270721435546875, -0.016357421875, -7.62939453125e-06, 0.0163421630859375, 0.03269195556640625, 0.049041748046875, 0.06539154052734375, 0.0817413330078125, 0.09809112548828125, 0.11444091796875, 0.13079071044921875, 0.1471405029296875, 0.16349029541015625, 0.179840087890625, 0.19618988037109375, 0.2125396728515625, 0.22888946533203125, 0.2452392578125, 0.26158905029296875, 0.2779388427734375, 0.29428863525390625, 0.310638427734375, 0.32698822021484375, 0.3433380126953125, 0.35968780517578125, 0.37603759765625, 0.39238739013671875, 0.4087371826171875, 0.42508697509765625, 0.441436767578125, 0.45778656005859375, 0.4741363525390625, 0.49048614501953125, 0.5068359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 14.0, 8.0, 16.0, 17.0, 24.0, 29.0, 56.0, 74.0, 94.0, 119.0, 127.0, 139.0, 72.0, 58.0, 48.0, 43.0, 16.0, 8.0, 8.0, 11.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.647275924682617e-05, -7.418449968099594e-05, -7.189624011516571e-05, -6.960798054933548e-05, -6.731972098350525e-05, -6.503146141767502e-05, -6.274320185184479e-05, -6.045494228601456e-05, -5.8166682720184326e-05, -5.5878423154354095e-05, -5.3590163588523865e-05, -5.1301904022693634e-05, -4.90136444568634e-05, -4.672538489103317e-05, -4.443712532520294e-05, -4.214886575937271e-05, -3.986060619354248e-05, -3.757234662771225e-05, -3.528408706188202e-05, -3.299582749605179e-05, -3.070756793022156e-05, -2.8419308364391327e-05, -2.6131048798561096e-05, -2.3842789232730865e-05, -2.1554529666900635e-05, -1.9266270101070404e-05, -1.6978010535240173e-05, -1.4689750969409943e-05, -1.2401491403579712e-05, -1.0113231837749481e-05, -7.82497227191925e-06, -5.53671270608902e-06, -3.248453140258789e-06, -9.601935744285583e-07, 1.3280659914016724e-06, 3.616325557231903e-06, 5.904585123062134e-06, 8.192844688892365e-06, 1.0481104254722595e-05, 1.2769363820552826e-05, 1.5057623386383057e-05, 1.7345882952213287e-05, 1.9634142518043518e-05, 2.192240208387375e-05, 2.421066164970398e-05, 2.649892121553421e-05, 2.878718078136444e-05, 3.107544034719467e-05, 3.33636999130249e-05, 3.565195947885513e-05, 3.7940219044685364e-05, 4.0228478610515594e-05, 4.2516738176345825e-05, 4.4804997742176056e-05, 4.709325730800629e-05, 4.938151687383652e-05, 5.166977643966675e-05, 5.395803600549698e-05, 5.624629557132721e-05, 5.853455513715744e-05, 6.082281470298767e-05, 6.31110742688179e-05, 6.539933383464813e-05, 6.768759340047836e-05, 6.99758529663086e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 2.0, 7.0, 10.0, 15.0, 15.0, 16.0, 12.0, 16.0, 29.0, 30.0, 45.0, 75.0, 153.0, 463.0, 2400.0, 21764.0, 322943.0, 638040.0, 56431.0, 4733.0, 771.0, 233.0, 102.0, 40.0, 25.0, 27.0, 23.0, 21.0, 19.0, 12.0, 13.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 8.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97119140625, -0.941009521484375, -0.91082763671875, -0.880645751953125, -0.8504638671875, -0.820281982421875, -0.79010009765625, -0.759918212890625, -0.729736328125, -0.699554443359375, -0.66937255859375, -0.639190673828125, -0.6090087890625, -0.578826904296875, -0.54864501953125, -0.518463134765625, -0.48828125, -0.458099365234375, -0.42791748046875, -0.397735595703125, -0.3675537109375, -0.337371826171875, -0.30718994140625, -0.277008056640625, -0.246826171875, -0.216644287109375, -0.18646240234375, -0.156280517578125, -0.1260986328125, -0.095916748046875, -0.06573486328125, -0.035552978515625, -0.00537109375, 0.024810791015625, 0.05499267578125, 0.085174560546875, 0.1153564453125, 0.145538330078125, 0.17572021484375, 0.205902099609375, 0.236083984375, 0.266265869140625, 0.29644775390625, 0.326629638671875, 0.3568115234375, 0.386993408203125, 0.41717529296875, 0.447357177734375, 0.4775390625, 0.507720947265625, 0.53790283203125, 0.568084716796875, 0.5982666015625, 0.628448486328125, 0.65863037109375, 0.688812255859375, 0.718994140625, 0.749176025390625, 0.77935791015625, 0.809539794921875, 0.8397216796875, 0.869903564453125, 0.90008544921875, 0.930267333984375, 0.96044921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 3.0, 6.0, 8.0, 15.0, 13.0, 16.0, 20.0, 18.0, 26.0, 31.0, 37.0, 32.0, 42.0, 38.0, 45.0, 68.0, 64.0, 59.0, 61.0, 54.0, 56.0, 34.0, 39.0, 31.0, 19.0, 22.0, 18.0, 26.0, 12.0, 17.0, 8.0, 4.0, 11.0, 5.0, 7.0, 3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2449951171875, -0.23816299438476562, -0.23133087158203125, -0.22449874877929688, -0.2176666259765625, -0.21083450317382812, -0.20400238037109375, -0.19717025756835938, -0.190338134765625, -0.18350601196289062, -0.17667388916015625, -0.16984176635742188, -0.1630096435546875, -0.15617752075195312, -0.14934539794921875, -0.14251327514648438, -0.13568115234375, -0.12884902954101562, -0.12201690673828125, -0.11518478393554688, -0.1083526611328125, -0.10152053833007812, -0.09468841552734375, -0.08785629272460938, -0.081024169921875, -0.07419204711914062, -0.06735992431640625, -0.060527801513671875, -0.0536956787109375, -0.046863555908203125, -0.04003143310546875, -0.033199310302734375, -0.0263671875, -0.019535064697265625, -0.01270294189453125, -0.005870819091796875, 0.0009613037109375, 0.007793426513671875, 0.01462554931640625, 0.021457672119140625, 0.028289794921875, 0.035121917724609375, 0.04195404052734375, 0.048786163330078125, 0.0556182861328125, 0.062450408935546875, 0.06928253173828125, 0.07611465454101562, 0.08294677734375, 0.08977890014648438, 0.09661102294921875, 0.10344314575195312, 0.1102752685546875, 0.11710739135742188, 0.12393951416015625, 0.13077163696289062, 0.137603759765625, 0.14443588256835938, 0.15126800537109375, 0.15810012817382812, 0.1649322509765625, 0.17176437377929688, 0.17859649658203125, 0.18542861938476562, 0.1922607421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 71.0, 536.0, 370.0, 27.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.06617546081543, -24.51956558227539, -23.97295570373535, -23.426345825195312, -22.879737854003906, -22.333127975463867, -21.786518096923828, -21.23990821838379, -20.69329833984375, -20.14668846130371, -19.600078582763672, -19.053470611572266, -18.506860733032227, -17.960250854492188, -17.41364097595215, -16.86703109741211, -16.320423126220703, -15.773813247680664, -15.227204322814941, -14.680594444274902, -14.133984565734863, -13.58737564086914, -13.040765762329102, -12.494155883789062, -11.947546005249023, -11.400936126708984, -10.854327201843262, -10.307717323303223, -9.761107444763184, -9.214498519897461, -8.667888641357422, -8.121278762817383, -7.57466983795166, -7.028060436248779, -6.48145055770874, -5.934841156005859, -5.38823127746582, -4.8416218757629395, -4.295012474060059, -3.7484028339385986, -3.2017931938171387, -2.6551835536956787, -2.1085739135742188, -1.561964511871338, -1.015354871749878, -0.46874523162841797, 0.07786417007446289, 0.6244738101959229, 1.1710834503173828, 1.7176930904388428, 2.2643027305603027, 2.8109121322631836, 3.3575217723846436, 3.9041314125061035, 4.450740814208984, 4.997350692749023, 5.543960094451904, 6.090569496154785, 6.637179374694824, 7.183788776397705, 7.730398178100586, 8.277008056640625, 8.823617935180664, 9.370226860046387, 9.916836738586426]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 5.0, 2.0, 8.0, 6.0, 4.0, 12.0, 11.0, 10.0, 17.0, 15.0, 31.0, 28.0, 24.0, 18.0, 31.0, 31.0, 33.0, 40.0, 40.0, 39.0, 48.0, 43.0, 43.0, 40.0, 45.0, 29.0, 48.0, 38.0, 33.0, 37.0, 30.0, 23.0, 23.0, 20.0, 14.0, 11.0, 8.0, 7.0, 10.0, 14.0, 5.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.0680222511291504, -2.9741525650024414, -2.8802831172943115, -2.7864134311676025, -2.6925439834594727, -2.5986742973327637, -2.5048046112060547, -2.410935163497925, -2.317065715789795, -2.223196029663086, -2.129326581954956, -2.035456895828247, -1.9415874481201172, -1.8477177619934082, -1.7538481950759888, -1.6599786281585693, -1.5661089420318604, -1.472239375114441, -1.3783698081970215, -1.2845001220703125, -1.1906306743621826, -1.0967609882354736, -1.0028914213180542, -0.9090218544006348, -0.8151522874832153, -0.7212827205657959, -0.6274131536483765, -0.5335435271263123, -0.4396739602088928, -0.3458043932914734, -0.2519347667694092, -0.15806519985198975, -0.06419539451599121, 0.029674187302589417, 0.12354376912117004, 0.21741336584091187, 0.3112829327583313, 0.40515249967575073, 0.49902212619781494, 0.5928916931152344, 0.6867612600326538, 0.7806308269500732, 0.8745003938674927, 0.9683700203895569, 1.062239646911621, 1.156109094619751, 1.24997878074646, 1.3438483476638794, 1.4377179145812988, 1.5315874814987183, 1.6254570484161377, 1.7193267345428467, 1.8131961822509766, 1.9070658683776855, 2.0009355545043945, 2.0948050022125244, 2.1886744499206543, 2.2825441360473633, 2.376413583755493, 2.470283269882202, 2.564152717590332, 2.658022403717041, 2.75189208984375, 2.84576153755188, 2.939631223678589]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 10.0, 8.0, 15.0, 27.0, 22.0, 48.0, 47.0, 89.0, 111.0, 158.0, 271.0, 409.0, 862.0, 1744.0, 4696.0, 15691.0, 73557.0, 604879.0, 2928641.0, 479315.0, 62428.0, 13599.0, 4208.0, 1602.0, 719.0, 381.0, 233.0, 152.0, 102.0, 65.0, 53.0, 33.0, 28.0, 14.0, 14.0, 14.0, 8.0, 6.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1627197265625, -1.120361328125, -1.0780029296875, -1.03564453125, -0.9932861328125, -0.950927734375, -0.9085693359375, -0.8662109375, -0.8238525390625, -0.781494140625, -0.7391357421875, -0.69677734375, -0.6544189453125, -0.612060546875, -0.5697021484375, -0.52734375, -0.4849853515625, -0.442626953125, -0.4002685546875, -0.35791015625, -0.3155517578125, -0.273193359375, -0.2308349609375, -0.1884765625, -0.1461181640625, -0.103759765625, -0.0614013671875, -0.01904296875, 0.0233154296875, 0.065673828125, 0.1080322265625, 0.150390625, 0.1927490234375, 0.235107421875, 0.2774658203125, 0.31982421875, 0.3621826171875, 0.404541015625, 0.4468994140625, 0.4892578125, 0.5316162109375, 0.573974609375, 0.6163330078125, 0.65869140625, 0.7010498046875, 0.743408203125, 0.7857666015625, 0.828125, 0.8704833984375, 0.912841796875, 0.9552001953125, 0.99755859375, 1.0399169921875, 1.082275390625, 1.1246337890625, 1.1669921875, 1.2093505859375, 1.251708984375, 1.2940673828125, 1.33642578125, 1.3787841796875, 1.421142578125, 1.4635009765625, 1.505859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 8.0, 11.0, 16.0, 8.0, 15.0, 19.0, 26.0, 29.0, 29.0, 40.0, 49.0, 51.0, 71.0, 55.0, 48.0, 53.0, 56.0, 61.0, 60.0, 51.0, 51.0, 35.0, 33.0, 25.0, 20.0, 18.0, 12.0, 13.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5147781372070312, -0.4983062744140625, -0.48183441162109375, -0.465362548828125, -0.44889068603515625, -0.4324188232421875, -0.41594696044921875, -0.39947509765625, -0.38300323486328125, -0.3665313720703125, -0.35005950927734375, -0.333587646484375, -0.31711578369140625, -0.3006439208984375, -0.28417205810546875, -0.2677001953125, -0.25122833251953125, -0.2347564697265625, -0.21828460693359375, -0.201812744140625, -0.18534088134765625, -0.1688690185546875, -0.15239715576171875, -0.13592529296875, -0.11945343017578125, -0.1029815673828125, -0.08650970458984375, -0.070037841796875, -0.05356597900390625, -0.0370941162109375, -0.02062225341796875, -0.004150390625, 0.01232147216796875, 0.0287933349609375, 0.04526519775390625, 0.061737060546875, 0.07820892333984375, 0.0946807861328125, 0.11115264892578125, 0.12762451171875, 0.14409637451171875, 0.1605682373046875, 0.17704010009765625, 0.193511962890625, 0.20998382568359375, 0.2264556884765625, 0.24292755126953125, 0.2593994140625, 0.27587127685546875, 0.2923431396484375, 0.30881500244140625, 0.325286865234375, 0.34175872802734375, 0.3582305908203125, 0.37470245361328125, 0.39117431640625, 0.40764617919921875, 0.4241180419921875, 0.44058990478515625, 0.457061767578125, 0.47353363037109375, 0.4900054931640625, 0.5064773559570312, 0.52294921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 21.0, 17.0, 33.0, 56.0, 103.0, 208.0, 367.0, 813.0, 1931.0, 5711.0, 19805.0, 79772.0, 381731.0, 1721793.0, 1546447.0, 337316.0, 71942.0, 17724.0, 5129.0, 1792.0, 778.0, 336.0, 180.0, 102.0, 66.0, 36.0, 24.0, 14.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.32977294921875, -1.2894287109375, -1.24908447265625, -1.208740234375, -1.16839599609375, -1.1280517578125, -1.08770751953125, -1.04736328125, -1.00701904296875, -0.9666748046875, -0.92633056640625, -0.885986328125, -0.84564208984375, -0.8052978515625, -0.76495361328125, -0.724609375, -0.68426513671875, -0.6439208984375, -0.60357666015625, -0.563232421875, -0.52288818359375, -0.4825439453125, -0.44219970703125, -0.40185546875, -0.36151123046875, -0.3211669921875, -0.28082275390625, -0.240478515625, -0.20013427734375, -0.1597900390625, -0.11944580078125, -0.0791015625, -0.03875732421875, 0.0015869140625, 0.04193115234375, 0.082275390625, 0.12261962890625, 0.1629638671875, 0.20330810546875, 0.24365234375, 0.28399658203125, 0.3243408203125, 0.36468505859375, 0.405029296875, 0.44537353515625, 0.4857177734375, 0.52606201171875, 0.56640625, 0.60675048828125, 0.6470947265625, 0.68743896484375, 0.727783203125, 0.76812744140625, 0.8084716796875, 0.84881591796875, 0.88916015625, 0.92950439453125, 0.9698486328125, 1.01019287109375, 1.050537109375, 1.09088134765625, 1.1312255859375, 1.17156982421875, 1.2119140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 13.0, 9.0, 22.0, 23.0, 30.0, 44.0, 69.0, 94.0, 105.0, 177.0, 228.0, 278.0, 359.0, 461.0, 465.0, 386.0, 275.0, 249.0, 180.0, 163.0, 92.0, 93.0, 70.0, 48.0, 37.0, 24.0, 18.0, 13.0, 12.0, 6.0, 6.0, 5.0, 2.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6384658813476562, -0.6172637939453125, -0.5960617065429688, -0.574859619140625, -0.5536575317382812, -0.5324554443359375, -0.5112533569335938, -0.49005126953125, -0.46884918212890625, -0.4476470947265625, -0.42644500732421875, -0.405242919921875, -0.38404083251953125, -0.3628387451171875, -0.34163665771484375, -0.3204345703125, -0.29923248291015625, -0.2780303955078125, -0.25682830810546875, -0.235626220703125, -0.21442413330078125, -0.1932220458984375, -0.17201995849609375, -0.15081787109375, -0.12961578369140625, -0.1084136962890625, -0.08721160888671875, -0.066009521484375, -0.04480743408203125, -0.0236053466796875, -0.00240325927734375, 0.018798828125, 0.04000091552734375, 0.0612030029296875, 0.08240509033203125, 0.103607177734375, 0.12480926513671875, 0.1460113525390625, 0.16721343994140625, 0.18841552734375, 0.20961761474609375, 0.2308197021484375, 0.25202178955078125, 0.273223876953125, 0.29442596435546875, 0.3156280517578125, 0.33683013916015625, 0.3580322265625, 0.37923431396484375, 0.4004364013671875, 0.42163848876953125, 0.442840576171875, 0.46404266357421875, 0.4852447509765625, 0.5064468383789062, 0.52764892578125, 0.5488510131835938, 0.5700531005859375, 0.5912551879882812, 0.612457275390625, 0.6336593627929688, 0.6548614501953125, 0.6760635375976562, 0.697265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 12.0, 103.0, 414.0, 370.0, 94.0, 16.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.4108829498291, -17.938404083251953, -17.465925216674805, -16.993446350097656, -16.520967483520508, -16.04848861694336, -15.576010704040527, -15.103531837463379, -14.63105297088623, -14.158574104309082, -13.686095237731934, -13.213617324829102, -12.741138458251953, -12.268659591674805, -11.796180725097656, -11.323701858520508, -10.85122299194336, -10.378744125366211, -9.906265258789062, -9.433786392211914, -8.961308479309082, -8.488829612731934, -8.016350746154785, -7.543871879577637, -7.071393966674805, -6.598915100097656, -6.126436710357666, -5.653957843780518, -5.181478977203369, -4.709000587463379, -4.2365217208862305, -3.764042854309082, -3.2915639877319336, -2.8190853595733643, -2.346606492996216, -1.8741278648376465, -1.4016491174697876, -0.9291703701019287, -0.4566917419433594, 0.015787124633789062, 0.4882657527923584, 0.9607445001602173, 1.4332232475280762, 1.9057018756866455, 2.378180503845215, 2.8506593704223633, 3.3231379985809326, 3.795616865158081, 4.26809549331665, 4.740574359893799, 5.213052749633789, 5.6855316162109375, 6.158010482788086, 6.630489349365234, 7.102967739105225, 7.575446605682373, 8.047924995422363, 8.520403861999512, 8.99288272857666, 9.465360641479492, 9.93783950805664, 10.410318374633789, 10.882797241210938, 11.355276107788086, 11.827754974365234]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 9.0, 8.0, 12.0, 20.0, 10.0, 22.0, 23.0, 20.0, 23.0, 32.0, 31.0, 38.0, 41.0, 34.0, 48.0, 48.0, 53.0, 40.0, 42.0, 52.0, 37.0, 52.0, 37.0, 30.0, 38.0, 23.0, 27.0, 19.0, 20.0, 15.0, 11.0, 14.0, 13.0, 8.0, 17.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.070319414138794, -2.000481128692627, -1.930643081665039, -1.8608049154281616, -1.7909667491912842, -1.7211284637451172, -1.6512902975082397, -1.5814521312713623, -1.5116139650344849, -1.4417757987976074, -1.37193763256073, -1.3020994663238525, -1.2322611808776855, -1.1624231338500977, -1.0925848484039307, -1.0227466821670532, -0.9529085159301758, -0.8830703496932983, -0.8132321834564209, -0.7433939576148987, -0.6735557913780212, -0.6037176251411438, -0.5338793992996216, -0.46404123306274414, -0.3942030668258667, -0.32436490058898926, -0.25452670454978943, -0.1846885234117508, -0.11485034227371216, -0.04501217603683472, 0.024826020002365112, 0.09466421604156494, 0.16450214385986328, 0.23434032499790192, 0.30417850613594055, 0.3740167021751404, 0.4438548684120178, 0.5136930346488953, 0.5835312604904175, 0.6533694267272949, 0.7232075929641724, 0.7930457592010498, 0.8628839254379272, 0.9327221512794495, 1.0025603771209717, 1.0723984241485596, 1.1422367095947266, 1.212074875831604, 1.2819130420684814, 1.3517512083053589, 1.4215893745422363, 1.4914275407791138, 1.5612657070159912, 1.6311039924621582, 1.7009421586990356, 1.770780324935913, 1.8406184911727905, 1.910456657409668, 1.9802948236465454, 2.050132989883423, 2.11997127532959, 2.1898093223571777, 2.2596476078033447, 2.3294858932495117, 2.3993239402770996]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 7.0, 14.0, 26.0, 41.0, 79.0, 147.0, 382.0, 866.0, 2185.0, 5658.0, 16915.0, 85325.0, 482121.0, 375312.0, 58284.0, 13298.0, 4717.0, 1797.0, 752.0, 302.0, 139.0, 69.0, 29.0, 21.0, 16.0, 10.0, 8.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.466796875, -2.38946533203125, -2.3121337890625, -2.23480224609375, -2.157470703125, -2.08013916015625, -2.0028076171875, -1.92547607421875, -1.84814453125, -1.77081298828125, -1.6934814453125, -1.61614990234375, -1.538818359375, -1.46148681640625, -1.3841552734375, -1.30682373046875, -1.2294921875, -1.15216064453125, -1.0748291015625, -0.99749755859375, -0.920166015625, -0.84283447265625, -0.7655029296875, -0.68817138671875, -0.61083984375, -0.53350830078125, -0.4561767578125, -0.37884521484375, -0.301513671875, -0.22418212890625, -0.1468505859375, -0.06951904296875, 0.0078125, 0.08514404296875, 0.1624755859375, 0.23980712890625, 0.317138671875, 0.39447021484375, 0.4718017578125, 0.54913330078125, 0.62646484375, 0.70379638671875, 0.7811279296875, 0.85845947265625, 0.935791015625, 1.01312255859375, 1.0904541015625, 1.16778564453125, 1.2451171875, 1.32244873046875, 1.3997802734375, 1.47711181640625, 1.554443359375, 1.63177490234375, 1.7091064453125, 1.78643798828125, 1.86376953125, 1.94110107421875, 2.0184326171875, 2.09576416015625, 2.173095703125, 2.25042724609375, 2.3277587890625, 2.40509033203125, 2.482421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 15.0, 14.0, 22.0, 27.0, 29.0, 30.0, 43.0, 54.0, 67.0, 59.0, 68.0, 56.0, 81.0, 62.0, 70.0, 68.0, 44.0, 33.0, 37.0, 26.0, 20.0, 14.0, 15.0, 10.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.642578125, -0.6239776611328125, -0.605377197265625, -0.5867767333984375, -0.56817626953125, -0.5495758056640625, -0.530975341796875, -0.5123748779296875, -0.4937744140625, -0.4751739501953125, -0.456573486328125, -0.4379730224609375, -0.41937255859375, -0.4007720947265625, -0.382171630859375, -0.3635711669921875, -0.344970703125, -0.3263702392578125, -0.307769775390625, -0.2891693115234375, -0.27056884765625, -0.2519683837890625, -0.233367919921875, -0.2147674560546875, -0.1961669921875, -0.1775665283203125, -0.158966064453125, -0.1403656005859375, -0.12176513671875, -0.1031646728515625, -0.084564208984375, -0.0659637451171875, -0.04736328125, -0.0287628173828125, -0.010162353515625, 0.0084381103515625, 0.02703857421875, 0.0456390380859375, 0.064239501953125, 0.0828399658203125, 0.1014404296875, 0.1200408935546875, 0.138641357421875, 0.1572418212890625, 0.17584228515625, 0.1944427490234375, 0.213043212890625, 0.2316436767578125, 0.250244140625, 0.2688446044921875, 0.287445068359375, 0.3060455322265625, 0.32464599609375, 0.3432464599609375, 0.361846923828125, 0.3804473876953125, 0.3990478515625, 0.4176483154296875, 0.436248779296875, 0.4548492431640625, 0.47344970703125, 0.4920501708984375, 0.510650634765625, 0.5292510986328125, 0.5478515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 6.0, 8.0, 5.0, 14.0, 10.0, 18.0, 21.0, 33.0, 53.0, 80.0, 126.0, 188.0, 374.0, 712.0, 1451.0, 3008.0, 6141.0, 13874.0, 37405.0, 128467.0, 355691.0, 332053.0, 111543.0, 33000.0, 12789.0, 5713.0, 2813.0, 1400.0, 668.0, 347.0, 169.0, 134.0, 62.0, 48.0, 42.0, 18.0, 17.0, 12.0, 11.0, 5.0, 6.0, 6.0, 4.0, 0.0, 7.0, 0.0, 1.0, 2.0], "bins": [-1.677734375, -1.63232421875, -1.5869140625, -1.54150390625, -1.49609375, -1.45068359375, -1.4052734375, -1.35986328125, -1.314453125, -1.26904296875, -1.2236328125, -1.17822265625, -1.1328125, -1.08740234375, -1.0419921875, -0.99658203125, -0.951171875, -0.90576171875, -0.8603515625, -0.81494140625, -0.76953125, -0.72412109375, -0.6787109375, -0.63330078125, -0.587890625, -0.54248046875, -0.4970703125, -0.45166015625, -0.40625, -0.36083984375, -0.3154296875, -0.27001953125, -0.224609375, -0.17919921875, -0.1337890625, -0.08837890625, -0.04296875, 0.00244140625, 0.0478515625, 0.09326171875, 0.138671875, 0.18408203125, 0.2294921875, 0.27490234375, 0.3203125, 0.36572265625, 0.4111328125, 0.45654296875, 0.501953125, 0.54736328125, 0.5927734375, 0.63818359375, 0.68359375, 0.72900390625, 0.7744140625, 0.81982421875, 0.865234375, 0.91064453125, 0.9560546875, 1.00146484375, 1.046875, 1.09228515625, 1.1376953125, 1.18310546875, 1.228515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 17.0, 10.0, 19.0, 22.0, 19.0, 32.0, 29.0, 41.0, 42.0, 31.0, 46.0, 59.0, 55.0, 64.0, 50.0, 56.0, 55.0, 42.0, 43.0, 41.0, 28.0, 36.0, 20.0, 20.0, 19.0, 18.0, 18.0, 10.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.943359375, -0.9108123779296875, -0.878265380859375, -0.8457183837890625, -0.81317138671875, -0.7806243896484375, -0.748077392578125, -0.7155303955078125, -0.6829833984375, -0.6504364013671875, -0.617889404296875, -0.5853424072265625, -0.55279541015625, -0.5202484130859375, -0.487701416015625, -0.4551544189453125, -0.422607421875, -0.3900604248046875, -0.357513427734375, -0.3249664306640625, -0.29241943359375, -0.2598724365234375, -0.227325439453125, -0.1947784423828125, -0.1622314453125, -0.1296844482421875, -0.097137451171875, -0.0645904541015625, -0.03204345703125, 0.0005035400390625, 0.033050537109375, 0.0655975341796875, 0.09814453125, 0.1306915283203125, 0.163238525390625, 0.1957855224609375, 0.22833251953125, 0.2608795166015625, 0.293426513671875, 0.3259735107421875, 0.3585205078125, 0.3910675048828125, 0.423614501953125, 0.4561614990234375, 0.48870849609375, 0.5212554931640625, 0.553802490234375, 0.5863494873046875, 0.618896484375, 0.6514434814453125, 0.683990478515625, 0.7165374755859375, 0.74908447265625, 0.7816314697265625, 0.814178466796875, 0.8467254638671875, 0.8792724609375, 0.9118194580078125, 0.944366455078125, 0.9769134521484375, 1.00946044921875, 1.0420074462890625, 1.074554443359375, 1.1071014404296875, 1.1396484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 5.0, 26.0, 38.0, 50.0, 85.0, 154.0, 225.0, 429.0, 759.0, 1522.0, 4145.0, 17709.0, 238010.0, 719525.0, 53035.0, 7795.0, 2502.0, 1163.0, 586.0, 316.0, 186.0, 102.0, 66.0, 32.0, 25.0, 14.0, 14.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.10845947265625, -2.0430908203125, -1.97772216796875, -1.912353515625, -1.84698486328125, -1.7816162109375, -1.71624755859375, -1.65087890625, -1.58551025390625, -1.5201416015625, -1.45477294921875, -1.389404296875, -1.32403564453125, -1.2586669921875, -1.19329833984375, -1.1279296875, -1.06256103515625, -0.9971923828125, -0.93182373046875, -0.866455078125, -0.80108642578125, -0.7357177734375, -0.67034912109375, -0.60498046875, -0.53961181640625, -0.4742431640625, -0.40887451171875, -0.343505859375, -0.27813720703125, -0.2127685546875, -0.14739990234375, -0.08203125, -0.01666259765625, 0.0487060546875, 0.11407470703125, 0.179443359375, 0.24481201171875, 0.3101806640625, 0.37554931640625, 0.44091796875, 0.50628662109375, 0.5716552734375, 0.63702392578125, 0.702392578125, 0.76776123046875, 0.8331298828125, 0.89849853515625, 0.9638671875, 1.02923583984375, 1.0946044921875, 1.15997314453125, 1.225341796875, 1.29071044921875, 1.3560791015625, 1.42144775390625, 1.48681640625, 1.55218505859375, 1.6175537109375, 1.68292236328125, 1.748291015625, 1.81365966796875, 1.8790283203125, 1.94439697265625, 2.009765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 12.0, 12.0, 19.0, 62.0, 136.0, 269.0, 252.0, 116.0, 46.0, 18.0, 13.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00028252601623535156, -0.00027577951550483704, -0.0002690330147743225, -0.000262286514043808, -0.00025554001331329346, -0.00024879351258277893, -0.0002420470118522644, -0.00023530051112174988, -0.00022855401039123535, -0.00022180750966072083, -0.0002150610089302063, -0.00020831450819969177, -0.00020156800746917725, -0.00019482150673866272, -0.0001880750060081482, -0.00018132850527763367, -0.00017458200454711914, -0.00016783550381660461, -0.0001610890030860901, -0.00015434250235557556, -0.00014759600162506104, -0.0001408495008945465, -0.00013410300016403198, -0.00012735649943351746, -0.00012060999870300293, -0.0001138634979724884, -0.00010711699724197388, -0.00010037049651145935, -9.362399578094482e-05, -8.68774950504303e-05, -8.013099431991577e-05, -7.338449358940125e-05, -6.663799285888672e-05, -5.989149212837219e-05, -5.3144991397857666e-05, -4.639849066734314e-05, -3.965198993682861e-05, -3.290548920631409e-05, -2.615898847579956e-05, -1.9412487745285034e-05, -1.2665987014770508e-05, -5.9194862842559814e-06, 8.270144462585449e-07, 7.573515176773071e-06, 1.4320015907287598e-05, 2.1066516637802124e-05, 2.781301736831665e-05, 3.455951809883118e-05, 4.13060188293457e-05, 4.805251955986023e-05, 5.4799020290374756e-05, 6.154552102088928e-05, 6.829202175140381e-05, 7.503852248191833e-05, 8.178502321243286e-05, 8.853152394294739e-05, 9.527802467346191e-05, 0.00010202452540397644, 0.00010877102613449097, 0.00011551752686500549, 0.00012226402759552002, 0.00012901052832603455, 0.00013575702905654907, 0.0001425035297870636, 0.00014925003051757812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 9.0, 7.0, 8.0, 26.0, 29.0, 46.0, 87.0, 121.0, 200.0, 422.0, 804.0, 1603.0, 3424.0, 7790.0, 20097.0, 60116.0, 178145.0, 335669.0, 272430.0, 109858.0, 35272.0, 12404.0, 5168.0, 2305.0, 1158.0, 576.0, 317.0, 192.0, 98.0, 58.0, 29.0, 23.0, 13.0, 16.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5771484375, -0.5583877563476562, -0.5396270751953125, -0.5208663940429688, -0.502105712890625, -0.48334503173828125, -0.4645843505859375, -0.44582366943359375, -0.42706298828125, -0.40830230712890625, -0.3895416259765625, -0.37078094482421875, -0.352020263671875, -0.33325958251953125, -0.3144989013671875, -0.29573822021484375, -0.2769775390625, -0.25821685791015625, -0.2394561767578125, -0.22069549560546875, -0.201934814453125, -0.18317413330078125, -0.1644134521484375, -0.14565277099609375, -0.12689208984375, -0.10813140869140625, -0.0893707275390625, -0.07061004638671875, -0.051849365234375, -0.03308868408203125, -0.0143280029296875, 0.00443267822265625, 0.023193359375, 0.04195404052734375, 0.0607147216796875, 0.07947540283203125, 0.098236083984375, 0.11699676513671875, 0.1357574462890625, 0.15451812744140625, 0.17327880859375, 0.19203948974609375, 0.2108001708984375, 0.22956085205078125, 0.248321533203125, 0.26708221435546875, 0.2858428955078125, 0.30460357666015625, 0.3233642578125, 0.34212493896484375, 0.3608856201171875, 0.37964630126953125, 0.398406982421875, 0.41716766357421875, 0.4359283447265625, 0.45468902587890625, 0.47344970703125, 0.49221038818359375, 0.5109710693359375, 0.5297317504882812, 0.548492431640625, 0.5672531127929688, 0.5860137939453125, 0.6047744750976562, 0.62353515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 6.0, 14.0, 11.0, 20.0, 30.0, 25.0, 36.0, 37.0, 50.0, 66.0, 69.0, 59.0, 79.0, 71.0, 69.0, 51.0, 63.0, 50.0, 37.0, 40.0, 29.0, 22.0, 17.0, 13.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.3715782165527344, -0.35985565185546875, -0.3481330871582031, -0.3364105224609375, -0.3246879577636719, -0.31296539306640625, -0.3012428283691406, -0.289520263671875, -0.2777976989746094, -0.26607513427734375, -0.2543525695800781, -0.2426300048828125, -0.23090744018554688, -0.21918487548828125, -0.20746231079101562, -0.19573974609375, -0.18401718139648438, -0.17229461669921875, -0.16057205200195312, -0.1488494873046875, -0.13712692260742188, -0.12540435791015625, -0.11368179321289062, -0.101959228515625, -0.09023666381835938, -0.07851409912109375, -0.06679153442382812, -0.0550689697265625, -0.043346405029296875, -0.03162384033203125, -0.019901275634765625, -0.0081787109375, 0.003543853759765625, 0.01526641845703125, 0.026988983154296875, 0.0387115478515625, 0.050434112548828125, 0.06215667724609375, 0.07387924194335938, 0.085601806640625, 0.09732437133789062, 0.10904693603515625, 0.12076950073242188, 0.1324920654296875, 0.14421463012695312, 0.15593719482421875, 0.16765975952148438, 0.17938232421875, 0.19110488891601562, 0.20282745361328125, 0.21455001831054688, 0.2262725830078125, 0.23799514770507812, 0.24971771240234375, 0.2614402770996094, 0.273162841796875, 0.2848854064941406, 0.29660797119140625, 0.3083305358886719, 0.3200531005859375, 0.3317756652832031, 0.34349822998046875, 0.3552207946777344, 0.366943359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 20.0, 112.0, 385.0, 371.0, 91.0, 22.0, 8.0, 0.0, 2.0, 2.0], "bins": [-26.549686431884766, -26.083263397216797, -25.616840362548828, -25.150415420532227, -24.683992385864258, -24.21756935119629, -23.75114631652832, -23.28472137451172, -22.81829833984375, -22.35187530517578, -21.885452270507812, -21.41902732849121, -20.952604293823242, -20.486181259155273, -20.019758224487305, -19.553333282470703, -19.086910247802734, -18.620487213134766, -18.154064178466797, -17.687639236450195, -17.221216201782227, -16.754793167114258, -16.28837013244629, -15.821946144104004, -15.355523109436035, -14.889100074768066, -14.422676086425781, -13.956253051757812, -13.489829063415527, -13.023406028747559, -12.556982040405273, -12.090559005737305, -11.624135971069336, -11.157712936401367, -10.691288948059082, -10.224865913391113, -9.758441925048828, -9.29201889038086, -8.825594902038574, -8.359171867370605, -7.89274787902832, -7.426324367523193, -6.959900856018066, -6.4934773445129395, -6.0270538330078125, -5.560630798339844, -5.094206809997559, -4.62778377532959, -4.161359786987305, -3.6949362754821777, -3.228512763977051, -2.762089252471924, -2.295665740966797, -1.829242467880249, -1.362818956375122, -0.8963954448699951, -0.42997217178344727, 0.0364513099193573, 0.5028747916221619, 0.969298243522644, 1.435721755027771, 1.9021451473236084, 2.3685686588287354, 2.8349921703338623, 3.3014156818389893]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 10.0, 11.0, 15.0, 9.0, 12.0, 25.0, 21.0, 21.0, 16.0, 15.0, 32.0, 47.0, 43.0, 45.0, 30.0, 51.0, 41.0, 46.0, 35.0, 42.0, 53.0, 35.0, 33.0, 36.0, 32.0, 33.0, 36.0, 27.0, 13.0, 22.0, 12.0, 13.0, 13.0, 11.0, 6.0, 12.0, 5.0, 2.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.858982563018799, -2.7792370319366455, -2.6994917392730713, -2.619746208190918, -2.5400009155273438, -2.4602553844451904, -2.380510091781616, -2.300764560699463, -2.2210192680358887, -2.1412737369537354, -2.061528444290161, -1.9817830324172974, -1.9020376205444336, -1.8222920894622803, -1.7425466775894165, -1.6628012657165527, -1.5830557346343994, -1.5033103227615356, -1.4235649108886719, -1.343819499015808, -1.2640740871429443, -1.184328556060791, -1.1045831441879272, -1.0248377323150635, -0.9450923204421997, -0.8653469085693359, -0.7856014966964722, -0.7058560252189636, -0.6261106133460999, -0.5463652014732361, -0.4666197597980499, -0.38687431812286377, -0.30712890625, -0.22738347947597504, -0.14763805270195007, -0.06789262592792511, 0.011852800846099854, 0.09159821271896362, 0.17134365439414978, 0.25108909606933594, 0.3308345079421997, 0.4105799198150635, 0.49032536149024963, 0.5700708031654358, 0.6498162150382996, 0.7295616269111633, 0.8093070983886719, 0.8890525102615356, 0.9687979221343994, 1.0485433340072632, 1.128288745880127, 1.2080341577529907, 1.2877795696258545, 1.3675251007080078, 1.4472705125808716, 1.5270159244537354, 1.6067613363265991, 1.686506748199463, 1.7662521600723267, 1.8459975719451904, 1.9257431030273438, 2.005488395690918, 2.0852339267730713, 2.1649794578552246, 2.244724750518799]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 12.0, 8.0, 10.0, 21.0, 28.0, 25.0, 54.0, 71.0, 122.0, 142.0, 227.0, 337.0, 716.0, 1276.0, 2590.0, 5699.0, 13735.0, 38591.0, 127730.0, 550357.0, 1825813.0, 1228133.0, 282822.0, 73650.0, 24299.0, 9500.0, 4056.0, 1883.0, 999.0, 516.0, 331.0, 167.0, 105.0, 72.0, 53.0, 30.0, 25.0, 22.0, 15.0, 3.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.79150390625, -0.7680740356445312, -0.7446441650390625, -0.7212142944335938, -0.697784423828125, -0.6743545532226562, -0.6509246826171875, -0.6274948120117188, -0.60406494140625, -0.5806350708007812, -0.5572052001953125, -0.5337753295898438, -0.510345458984375, -0.48691558837890625, -0.4634857177734375, -0.44005584716796875, -0.4166259765625, -0.39319610595703125, -0.3697662353515625, -0.34633636474609375, -0.322906494140625, -0.29947662353515625, -0.2760467529296875, -0.25261688232421875, -0.22918701171875, -0.20575714111328125, -0.1823272705078125, -0.15889739990234375, -0.135467529296875, -0.11203765869140625, -0.0886077880859375, -0.06517791748046875, -0.041748046875, -0.01831817626953125, 0.0051116943359375, 0.02854156494140625, 0.051971435546875, 0.07540130615234375, 0.0988311767578125, 0.12226104736328125, 0.14569091796875, 0.16912078857421875, 0.1925506591796875, 0.21598052978515625, 0.239410400390625, 0.26284027099609375, 0.2862701416015625, 0.30970001220703125, 0.3331298828125, 0.35655975341796875, 0.3799896240234375, 0.40341949462890625, 0.426849365234375, 0.45027923583984375, 0.4737091064453125, 0.49713897705078125, 0.52056884765625, 0.5439987182617188, 0.5674285888671875, 0.5908584594726562, 0.614288330078125, 0.6377182006835938, 0.6611480712890625, 0.6845779418945312, 0.7080078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 2.0, 12.0, 12.0, 14.0, 18.0, 29.0, 49.0, 43.0, 43.0, 59.0, 66.0, 49.0, 52.0, 71.0, 58.0, 60.0, 60.0, 54.0, 55.0, 37.0, 24.0, 26.0, 25.0, 21.0, 12.0, 9.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5242462158203125, -0.506988525390625, -0.4897308349609375, -0.47247314453125, -0.4552154541015625, -0.437957763671875, -0.4207000732421875, -0.4034423828125, -0.3861846923828125, -0.368927001953125, -0.3516693115234375, -0.33441162109375, -0.3171539306640625, -0.299896240234375, -0.2826385498046875, -0.265380859375, -0.2481231689453125, -0.230865478515625, -0.2136077880859375, -0.19635009765625, -0.1790924072265625, -0.161834716796875, -0.1445770263671875, -0.1273193359375, -0.1100616455078125, -0.092803955078125, -0.0755462646484375, -0.05828857421875, -0.0410308837890625, -0.023773193359375, -0.0065155029296875, 0.0107421875, 0.0279998779296875, 0.045257568359375, 0.0625152587890625, 0.07977294921875, 0.0970306396484375, 0.114288330078125, 0.1315460205078125, 0.1488037109375, 0.1660614013671875, 0.183319091796875, 0.2005767822265625, 0.21783447265625, 0.2350921630859375, 0.252349853515625, 0.2696075439453125, 0.286865234375, 0.3041229248046875, 0.321380615234375, 0.3386383056640625, 0.35589599609375, 0.3731536865234375, 0.390411376953125, 0.4076690673828125, 0.4249267578125, 0.4421844482421875, 0.459442138671875, 0.4766998291015625, 0.49395751953125, 0.5112152099609375, 0.528472900390625, 0.5457305908203125, 0.56298828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 9.0, 19.0, 35.0, 56.0, 107.0, 177.0, 383.0, 846.0, 2286.0, 8105.0, 37345.0, 212131.0, 1219162.0, 2085442.0, 519408.0, 85590.0, 16579.0, 4140.0, 1351.0, 529.0, 252.0, 139.0, 72.0, 46.0, 26.0, 16.0, 12.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.373046875, -1.3340911865234375, -1.295135498046875, -1.2561798095703125, -1.21722412109375, -1.1782684326171875, -1.139312744140625, -1.1003570556640625, -1.0614013671875, -1.0224456787109375, -0.983489990234375, -0.9445343017578125, -0.90557861328125, -0.8666229248046875, -0.827667236328125, -0.7887115478515625, -0.749755859375, -0.7108001708984375, -0.671844482421875, -0.6328887939453125, -0.59393310546875, -0.5549774169921875, -0.516021728515625, -0.4770660400390625, -0.4381103515625, -0.3991546630859375, -0.360198974609375, -0.3212432861328125, -0.28228759765625, -0.2433319091796875, -0.204376220703125, -0.1654205322265625, -0.12646484375, -0.0875091552734375, -0.048553466796875, -0.0095977783203125, 0.02935791015625, 0.0683135986328125, 0.107269287109375, 0.1462249755859375, 0.1851806640625, 0.2241363525390625, 0.263092041015625, 0.3020477294921875, 0.34100341796875, 0.3799591064453125, 0.418914794921875, 0.4578704833984375, 0.496826171875, 0.5357818603515625, 0.574737548828125, 0.6136932373046875, 0.65264892578125, 0.6916046142578125, 0.730560302734375, 0.7695159912109375, 0.8084716796875, 0.8474273681640625, 0.886383056640625, 0.9253387451171875, 0.96429443359375, 1.0032501220703125, 1.042205810546875, 1.0811614990234375, 1.1201171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 5.0, 5.0, 11.0, 14.0, 19.0, 26.0, 46.0, 68.0, 93.0, 125.0, 171.0, 245.0, 291.0, 319.0, 391.0, 454.0, 373.0, 355.0, 262.0, 219.0, 160.0, 113.0, 88.0, 67.0, 46.0, 23.0, 29.0, 15.0, 14.0, 10.0, 12.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7744140625, -0.74810791015625, -0.7218017578125, -0.69549560546875, -0.669189453125, -0.64288330078125, -0.6165771484375, -0.59027099609375, -0.56396484375, -0.53765869140625, -0.5113525390625, -0.48504638671875, -0.458740234375, -0.43243408203125, -0.4061279296875, -0.37982177734375, -0.353515625, -0.32720947265625, -0.3009033203125, -0.27459716796875, -0.248291015625, -0.22198486328125, -0.1956787109375, -0.16937255859375, -0.14306640625, -0.11676025390625, -0.0904541015625, -0.06414794921875, -0.037841796875, -0.01153564453125, 0.0147705078125, 0.04107666015625, 0.0673828125, 0.09368896484375, 0.1199951171875, 0.14630126953125, 0.172607421875, 0.19891357421875, 0.2252197265625, 0.25152587890625, 0.27783203125, 0.30413818359375, 0.3304443359375, 0.35675048828125, 0.383056640625, 0.40936279296875, 0.4356689453125, 0.46197509765625, 0.48828125, 0.51458740234375, 0.5408935546875, 0.56719970703125, 0.593505859375, 0.61981201171875, 0.6461181640625, 0.67242431640625, 0.69873046875, 0.72503662109375, 0.7513427734375, 0.77764892578125, 0.803955078125, 0.83026123046875, 0.8565673828125, 0.88287353515625, 0.9091796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 18.0, 20.0, 44.0, 59.0, 83.0, 99.0, 110.0, 108.0, 113.0, 90.0, 86.0, 58.0, 43.0, 22.0, 17.0, 11.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.126149654388428, -5.982048988342285, -5.837948322296143, -5.693848133087158, -5.549747467041016, -5.405646800994873, -5.2615461349487305, -5.117445468902588, -4.973344802856445, -4.829244136810303, -4.68514347076416, -4.541043281555176, -4.396942615509033, -4.252841949462891, -4.108741283416748, -3.9646406173706055, -3.820540428161621, -3.6764397621154785, -3.532339334487915, -3.3882386684417725, -3.244138240814209, -3.1000375747680664, -2.955936908721924, -2.8118362426757812, -2.6677358150482178, -2.523635149002075, -2.3795347213745117, -2.235434055328369, -2.0913333892822266, -1.947232961654663, -1.8031322956085205, -1.6590317487716675, -1.5149307250976562, -1.3708301782608032, -1.2267296314239502, -1.0826289653778076, -0.9385284185409546, -0.7944278717041016, -0.6503272652626038, -0.506226658821106, -0.36212611198425293, -0.21802553534507751, -0.0739249587059021, 0.07017561793327332, 0.21427619457244873, 0.35837674140930176, 0.5024773478507996, 0.6465779542922974, 0.7906785011291504, 0.9347790479660034, 1.0788795948028564, 1.222980260848999, 1.367080807685852, 1.511181354522705, 1.6552820205688477, 1.7993825674057007, 1.9434831142425537, 2.0875837802886963, 2.2316842079162598, 2.3757848739624023, 2.519885540008545, 2.6639859676361084, 2.808086633682251, 2.9521870613098145, 3.096287727355957]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 13.0, 14.0, 16.0, 10.0, 14.0, 20.0, 29.0, 24.0, 26.0, 37.0, 29.0, 44.0, 37.0, 26.0, 40.0, 41.0, 31.0, 52.0, 29.0, 46.0, 44.0, 43.0, 43.0, 39.0, 29.0, 32.0, 24.0, 24.0, 26.0, 15.0, 19.0, 10.0, 13.0, 12.0, 12.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.309464454650879, -2.230226755142212, -2.150989294052124, -2.071751594543457, -1.9925140142440796, -1.9132764339447021, -1.8340388536453247, -1.7548012733459473, -1.6755635738372803, -1.5963259935379028, -1.5170884132385254, -1.4378507137298584, -1.358613133430481, -1.2793755531311035, -1.200137972831726, -1.1209003925323486, -1.0416628122329712, -0.9624252319335938, -0.8831875920295715, -0.8039500117301941, -0.7247123718261719, -0.6454747915267944, -0.566237211227417, -0.4869995713233948, -0.40776199102401733, -0.3285243809223175, -0.24928678572177887, -0.17004919052124023, -0.0908115804195404, -0.011573970317840576, 0.06766360998153687, 0.14690124988555908, 0.22613883018493652, 0.30537644028663635, 0.3846140503883362, 0.4638516306877136, 0.5430892705917358, 0.6223268508911133, 0.7015644311904907, 0.7808020710945129, 0.8600396513938904, 0.9392772316932678, 1.01851487159729, 1.0977524518966675, 1.176990032196045, 1.256227731704712, 1.3354651927947998, 1.4147028923034668, 1.4939404726028442, 1.5731780529022217, 1.6524156332015991, 1.7316532135009766, 1.8108909130096436, 1.890128493309021, 1.9693660736083984, 2.0486037731170654, 2.1278412342071533, 2.2070789337158203, 2.286316394805908, 2.365554094314575, 2.444791555404663, 2.52402925491333, 2.603266716003418, 2.682504415512085, 2.761742115020752]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 8.0, 5.0, 11.0, 12.0, 27.0, 34.0, 53.0, 77.0, 118.0, 254.0, 398.0, 768.0, 1654.0, 3742.0, 9136.0, 23144.0, 62629.0, 165004.0, 326173.0, 270233.0, 114590.0, 42603.0, 16100.0, 6426.0, 2656.0, 1248.0, 611.0, 318.0, 190.0, 116.0, 62.0, 41.0, 36.0, 21.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.6435546875, -1.594940185546875, -1.54632568359375, -1.497711181640625, -1.4490966796875, -1.400482177734375, -1.35186767578125, -1.303253173828125, -1.254638671875, -1.206024169921875, -1.15740966796875, -1.108795166015625, -1.0601806640625, -1.011566162109375, -0.96295166015625, -0.914337158203125, -0.86572265625, -0.817108154296875, -0.76849365234375, -0.719879150390625, -0.6712646484375, -0.622650146484375, -0.57403564453125, -0.525421142578125, -0.476806640625, -0.428192138671875, -0.37957763671875, -0.330963134765625, -0.2823486328125, -0.233734130859375, -0.18511962890625, -0.136505126953125, -0.087890625, -0.039276123046875, 0.00933837890625, 0.057952880859375, 0.1065673828125, 0.155181884765625, 0.20379638671875, 0.252410888671875, 0.301025390625, 0.349639892578125, 0.39825439453125, 0.446868896484375, 0.4954833984375, 0.544097900390625, 0.59271240234375, 0.641326904296875, 0.68994140625, 0.738555908203125, 0.78717041015625, 0.835784912109375, 0.8843994140625, 0.933013916015625, 0.98162841796875, 1.030242919921875, 1.078857421875, 1.127471923828125, 1.17608642578125, 1.224700927734375, 1.2733154296875, 1.321929931640625, 1.37054443359375, 1.419158935546875, 1.4677734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 3.0, 12.0, 20.0, 22.0, 20.0, 26.0, 32.0, 30.0, 33.0, 55.0, 54.0, 51.0, 59.0, 56.0, 53.0, 64.0, 63.0, 57.0, 45.0, 46.0, 39.0, 26.0, 23.0, 29.0, 12.0, 17.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.47115325927734375, -0.4554901123046875, -0.43982696533203125, -0.424163818359375, -0.40850067138671875, -0.3928375244140625, -0.37717437744140625, -0.36151123046875, -0.34584808349609375, -0.3301849365234375, -0.31452178955078125, -0.298858642578125, -0.28319549560546875, -0.2675323486328125, -0.25186920166015625, -0.2362060546875, -0.22054290771484375, -0.2048797607421875, -0.18921661376953125, -0.173553466796875, -0.15789031982421875, -0.1422271728515625, -0.12656402587890625, -0.11090087890625, -0.09523773193359375, -0.0795745849609375, -0.06391143798828125, -0.048248291015625, -0.03258514404296875, -0.0169219970703125, -0.00125885009765625, 0.014404296875, 0.03006744384765625, 0.0457305908203125, 0.06139373779296875, 0.077056884765625, 0.09272003173828125, 0.1083831787109375, 0.12404632568359375, 0.13970947265625, 0.15537261962890625, 0.1710357666015625, 0.18669891357421875, 0.202362060546875, 0.21802520751953125, 0.2336883544921875, 0.24935150146484375, 0.2650146484375, 0.28067779541015625, 0.2963409423828125, 0.31200408935546875, 0.327667236328125, 0.34333038330078125, 0.3589935302734375, 0.37465667724609375, 0.39031982421875, 0.40598297119140625, 0.4216461181640625, 0.43730926513671875, 0.452972412109375, 0.46863555908203125, 0.4842987060546875, 0.49996185302734375, 0.515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 10.0, 10.0, 17.0, 21.0, 17.0, 38.0, 60.0, 86.0, 164.0, 264.0, 516.0, 1015.0, 1903.0, 3713.0, 7316.0, 14493.0, 29491.0, 58592.0, 114167.0, 197285.0, 240098.0, 178022.0, 99873.0, 51100.0, 25092.0, 12424.0, 6178.0, 3036.0, 1603.0, 857.0, 447.0, 255.0, 135.0, 91.0, 53.0, 36.0, 20.0, 19.0, 13.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.236328125, -1.20037841796875, -1.1644287109375, -1.12847900390625, -1.092529296875, -1.05657958984375, -1.0206298828125, -0.98468017578125, -0.94873046875, -0.91278076171875, -0.8768310546875, -0.84088134765625, -0.804931640625, -0.76898193359375, -0.7330322265625, -0.69708251953125, -0.6611328125, -0.62518310546875, -0.5892333984375, -0.55328369140625, -0.517333984375, -0.48138427734375, -0.4454345703125, -0.40948486328125, -0.37353515625, -0.33758544921875, -0.3016357421875, -0.26568603515625, -0.229736328125, -0.19378662109375, -0.1578369140625, -0.12188720703125, -0.0859375, -0.04998779296875, -0.0140380859375, 0.02191162109375, 0.057861328125, 0.09381103515625, 0.1297607421875, 0.16571044921875, 0.20166015625, 0.23760986328125, 0.2735595703125, 0.30950927734375, 0.345458984375, 0.38140869140625, 0.4173583984375, 0.45330810546875, 0.4892578125, 0.52520751953125, 0.5611572265625, 0.59710693359375, 0.633056640625, 0.66900634765625, 0.7049560546875, 0.74090576171875, 0.77685546875, 0.81280517578125, 0.8487548828125, 0.88470458984375, 0.920654296875, 0.95660400390625, 0.9925537109375, 1.02850341796875, 1.064453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 12.0, 10.0, 23.0, 19.0, 28.0, 22.0, 23.0, 38.0, 25.0, 35.0, 29.0, 37.0, 38.0, 39.0, 42.0, 39.0, 43.0, 41.0, 40.0, 48.0, 38.0, 35.0, 36.0, 29.0, 39.0, 23.0, 30.0, 25.0, 18.0, 11.0, 15.0, 8.0, 4.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.805908203125, -0.77490234375, -0.743896484375, -0.712890625, -0.681884765625, -0.65087890625, -0.619873046875, -0.5888671875, -0.557861328125, -0.52685546875, -0.495849609375, -0.46484375, -0.433837890625, -0.40283203125, -0.371826171875, -0.3408203125, -0.309814453125, -0.27880859375, -0.247802734375, -0.216796875, -0.185791015625, -0.15478515625, -0.123779296875, -0.0927734375, -0.061767578125, -0.03076171875, 0.000244140625, 0.03125, 0.062255859375, 0.09326171875, 0.124267578125, 0.1552734375, 0.186279296875, 0.21728515625, 0.248291015625, 0.279296875, 0.310302734375, 0.34130859375, 0.372314453125, 0.4033203125, 0.434326171875, 0.46533203125, 0.496337890625, 0.52734375, 0.558349609375, 0.58935546875, 0.620361328125, 0.6513671875, 0.682373046875, 0.71337890625, 0.744384765625, 0.775390625, 0.806396484375, 0.83740234375, 0.868408203125, 0.8994140625, 0.930419921875, 0.96142578125, 0.992431640625, 1.0234375, 1.054443359375, 1.08544921875, 1.116455078125, 1.1474609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 9.0, 13.0, 19.0, 20.0, 32.0, 62.0, 63.0, 108.0, 148.0, 210.0, 322.0, 615.0, 1099.0, 2492.0, 7153.0, 31724.0, 206720.0, 568766.0, 188792.0, 28442.0, 6769.0, 2304.0, 1056.0, 578.0, 390.0, 188.0, 132.0, 118.0, 45.0, 44.0, 41.0, 19.0, 20.0, 15.0, 11.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2513275146484375, -1.205780029296875, -1.1602325439453125, -1.11468505859375, -1.0691375732421875, -1.023590087890625, -0.9780426025390625, -0.9324951171875, -0.8869476318359375, -0.841400146484375, -0.7958526611328125, -0.75030517578125, -0.7047576904296875, -0.659210205078125, -0.6136627197265625, -0.568115234375, -0.5225677490234375, -0.477020263671875, -0.4314727783203125, -0.38592529296875, -0.3403778076171875, -0.294830322265625, -0.2492828369140625, -0.2037353515625, -0.1581878662109375, -0.112640380859375, -0.0670928955078125, -0.02154541015625, 0.0240020751953125, 0.069549560546875, 0.1150970458984375, 0.16064453125, 0.2061920166015625, 0.251739501953125, 0.2972869873046875, 0.34283447265625, 0.3883819580078125, 0.433929443359375, 0.4794769287109375, 0.5250244140625, 0.5705718994140625, 0.616119384765625, 0.6616668701171875, 0.70721435546875, 0.7527618408203125, 0.798309326171875, 0.8438568115234375, 0.889404296875, 0.9349517822265625, 0.980499267578125, 1.0260467529296875, 1.07159423828125, 1.1171417236328125, 1.162689208984375, 1.2082366943359375, 1.2537841796875, 1.2993316650390625, 1.344879150390625, 1.3904266357421875, 1.43597412109375, 1.4815216064453125, 1.527069091796875, 1.5726165771484375, 1.6181640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 11.0, 25.0, 36.0, 91.0, 176.0, 244.0, 206.0, 96.0, 50.0, 23.0, 17.0, 14.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037384033203125, -0.0003646276891231537, -0.0003554150462150574, -0.00034620240330696106, -0.00033698976039886475, -0.00032777711749076843, -0.0003185644745826721, -0.0003093518316745758, -0.0003001391887664795, -0.0002909265458583832, -0.00028171390295028687, -0.00027250126004219055, -0.00026328861713409424, -0.0002540759742259979, -0.0002448633313179016, -0.0002356506884098053, -0.00022643804550170898, -0.00021722540259361267, -0.00020801275968551636, -0.00019880011677742004, -0.00018958747386932373, -0.00018037483096122742, -0.0001711621880531311, -0.0001619495451450348, -0.00015273690223693848, -0.00014352425932884216, -0.00013431161642074585, -0.00012509897351264954, -0.00011588633060455322, -0.00010667368769645691, -9.74610447883606e-05, -8.824840188026428e-05, -7.903575897216797e-05, -6.982311606407166e-05, -6.061047315597534e-05, -5.139783024787903e-05, -4.2185187339782715e-05, -3.29725444316864e-05, -2.3759901523590088e-05, -1.4547258615493774e-05, -5.334615707397461e-06, 3.8780272006988525e-06, 1.3090670108795166e-05, 2.230331301689148e-05, 3.151595592498779e-05, 4.0728598833084106e-05, 4.994124174118042e-05, 5.9153884649276733e-05, 6.836652755737305e-05, 7.757917046546936e-05, 8.679181337356567e-05, 9.600445628166199e-05, 0.0001052170991897583, 0.00011442974209785461, 0.00012364238500595093, 0.00013285502791404724, 0.00014206767082214355, 0.00015128031373023987, 0.00016049295663833618, 0.0001697055995464325, 0.0001789182424545288, 0.00018813088536262512, 0.00019734352827072144, 0.00020655617117881775, 0.00021576881408691406]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 19.0, 21.0, 31.0, 46.0, 55.0, 108.0, 128.0, 208.0, 323.0, 551.0, 890.0, 1621.0, 2719.0, 5220.0, 10366.0, 20769.0, 42923.0, 86481.0, 155435.0, 216951.0, 209614.0, 141067.0, 76597.0, 37926.0, 18241.0, 9227.0, 4803.0, 2515.0, 1421.0, 882.0, 485.0, 305.0, 206.0, 123.0, 81.0, 52.0, 46.0, 32.0, 18.0, 9.0, 9.0, 7.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.4001960754394531, -0.38681793212890625, -0.3734397888183594, -0.3600616455078125, -0.3466835021972656, -0.33330535888671875, -0.3199272155761719, -0.306549072265625, -0.2931709289550781, -0.27979278564453125, -0.2664146423339844, -0.2530364990234375, -0.23965835571289062, -0.22628021240234375, -0.21290206909179688, -0.19952392578125, -0.18614578247070312, -0.17276763916015625, -0.15938949584960938, -0.1460113525390625, -0.13263320922851562, -0.11925506591796875, -0.10587692260742188, -0.092498779296875, -0.07912063598632812, -0.06574249267578125, -0.052364349365234375, -0.0389862060546875, -0.025608062744140625, -0.01222991943359375, 0.001148223876953125, 0.0145263671875, 0.027904510498046875, 0.04128265380859375, 0.054660797119140625, 0.0680389404296875, 0.08141708374023438, 0.09479522705078125, 0.10817337036132812, 0.121551513671875, 0.13492965698242188, 0.14830780029296875, 0.16168594360351562, 0.1750640869140625, 0.18844223022460938, 0.20182037353515625, 0.21519851684570312, 0.22857666015625, 0.24195480346679688, 0.25533294677734375, 0.2687110900878906, 0.2820892333984375, 0.2954673767089844, 0.30884552001953125, 0.3222236633300781, 0.335601806640625, 0.3489799499511719, 0.36235809326171875, 0.3757362365722656, 0.3891143798828125, 0.4024925231933594, 0.41587066650390625, 0.4292488098144531, 0.442626953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 10.0, 8.0, 4.0, 9.0, 21.0, 29.0, 19.0, 29.0, 39.0, 48.0, 51.0, 51.0, 55.0, 64.0, 64.0, 70.0, 55.0, 57.0, 49.0, 39.0, 41.0, 24.0, 27.0, 24.0, 29.0, 15.0, 11.0, 8.0, 11.0, 8.0, 3.0, 2.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.372039794921875, -0.36029052734375, -0.348541259765625, -0.3367919921875, -0.325042724609375, -0.31329345703125, -0.301544189453125, -0.289794921875, -0.278045654296875, -0.26629638671875, -0.254547119140625, -0.2427978515625, -0.231048583984375, -0.21929931640625, -0.207550048828125, -0.19580078125, -0.184051513671875, -0.17230224609375, -0.160552978515625, -0.1488037109375, -0.137054443359375, -0.12530517578125, -0.113555908203125, -0.101806640625, -0.090057373046875, -0.07830810546875, -0.066558837890625, -0.0548095703125, -0.043060302734375, -0.03131103515625, -0.019561767578125, -0.0078125, 0.003936767578125, 0.01568603515625, 0.027435302734375, 0.0391845703125, 0.050933837890625, 0.06268310546875, 0.074432373046875, 0.086181640625, 0.097930908203125, 0.10968017578125, 0.121429443359375, 0.1331787109375, 0.144927978515625, 0.15667724609375, 0.168426513671875, 0.18017578125, 0.191925048828125, 0.20367431640625, 0.215423583984375, 0.2271728515625, 0.238922119140625, 0.25067138671875, 0.262420654296875, 0.274169921875, 0.285919189453125, 0.29766845703125, 0.309417724609375, 0.3211669921875, 0.332916259765625, 0.34466552734375, 0.356414794921875, 0.3681640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 11.0, 15.0, 20.0, 29.0, 36.0, 42.0, 54.0, 80.0, 98.0, 101.0, 88.0, 83.0, 74.0, 64.0, 49.0, 36.0, 30.0, 25.0, 20.0, 8.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.323822975158691, -5.1911516189575195, -5.058480262756348, -4.925808906555176, -4.793137550354004, -4.660466194152832, -4.52779483795166, -4.395123481750488, -4.262452125549316, -4.1297807693481445, -3.9971094131469727, -3.864438056945801, -3.731766700744629, -3.599095344543457, -3.466423749923706, -3.333752393722534, -3.201080799102783, -3.0684094429016113, -2.9357380867004395, -2.8030667304992676, -2.6703953742980957, -2.537724018096924, -2.405052423477173, -2.272381067276001, -2.139709711074829, -2.0070383548736572, -1.8743669986724854, -1.741695523262024, -1.609024167060852, -1.4763528108596802, -1.3436813354492188, -1.2110099792480469, -1.078338861465454, -0.9456675052642822, -0.8129960894584656, -0.6803246736526489, -0.547653317451477, -0.4149819612503052, -0.2823105454444885, -0.14963912963867188, -0.0169677734375, 0.11570361256599426, 0.24837499856948853, 0.3810463845729828, 0.513717770576477, 0.6463891267776489, 0.7790605425834656, 0.9117319583892822, 1.044403314590454, 1.177074670791626, 1.3097460269927979, 1.4424175024032593, 1.5750888586044312, 1.707760214805603, 1.8404316902160645, 1.9731030464172363, 2.105774402618408, 2.23844575881958, 2.371117115020752, 2.503788471221924, 2.6364598274230957, 2.7691311836242676, 2.9018027782440186, 3.0344741344451904, 3.1671454906463623]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 12.0, 5.0, 13.0, 17.0, 20.0, 21.0, 11.0, 31.0, 29.0, 34.0, 30.0, 41.0, 46.0, 35.0, 40.0, 50.0, 47.0, 52.0, 55.0, 52.0, 58.0, 41.0, 28.0, 31.0, 54.0, 33.0, 17.0, 23.0, 15.0, 9.0, 9.0, 6.0, 12.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3858189582824707, -3.2768642902374268, -3.167909860610962, -3.058955192565918, -2.950000762939453, -2.841046094894409, -2.7320914268493652, -2.6231369972229004, -2.5141823291778564, -2.4052276611328125, -2.2962732315063477, -2.1873185634613037, -2.078364133834839, -1.969409465789795, -1.8604549169540405, -1.7515003681182861, -1.6425458192825317, -1.5335912704467773, -1.424636721611023, -1.3156821727752686, -1.2067275047302246, -1.0977729558944702, -0.9888184070587158, -0.8798637986183167, -0.7709092497825623, -0.6619547009468079, -0.5530000925064087, -0.4440455436706543, -0.3350909650325775, -0.22613638639450073, -0.11718183755874634, -0.008227229118347168, 0.10072731971740723, 0.209681898355484, 0.3186364769935608, 0.4275910258293152, 0.5365456342697144, 0.6455001831054688, 0.7544547319412231, 0.8634093403816223, 0.9723638892173767, 1.0813184976577759, 1.1902730464935303, 1.2992275953292847, 1.408182144165039, 1.517136812210083, 1.6260912418365479, 1.7350459098815918, 1.8440004587173462, 1.9529550075531006, 2.0619096755981445, 2.1708641052246094, 2.2798187732696533, 2.3887734413146973, 2.497727870941162, 2.606682538986206, 2.715636968612671, 2.824591636657715, 2.9335460662841797, 3.0425007343292236, 3.1514551639556885, 3.2604098320007324, 3.3693642616271973, 3.478318929672241, 3.587273597717285]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 17.0, 21.0, 45.0, 74.0, 90.0, 163.0, 395.0, 1362.0, 11133.0, 253314.0, 3607779.0, 305916.0, 11853.0, 1364.0, 357.0, 136.0, 79.0, 56.0, 35.0, 21.0, 19.0, 11.0, 10.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.2151336669921875, -2.150970458984375, -2.0868072509765625, -2.02264404296875, -1.9584808349609375, -1.894317626953125, -1.8301544189453125, -1.7659912109375, -1.7018280029296875, -1.637664794921875, -1.5735015869140625, -1.50933837890625, -1.4451751708984375, -1.381011962890625, -1.3168487548828125, -1.252685546875, -1.1885223388671875, -1.124359130859375, -1.0601959228515625, -0.99603271484375, -0.9318695068359375, -0.867706298828125, -0.8035430908203125, -0.7393798828125, -0.6752166748046875, -0.611053466796875, -0.5468902587890625, -0.48272705078125, -0.4185638427734375, -0.354400634765625, -0.2902374267578125, -0.22607421875, -0.1619110107421875, -0.097747802734375, -0.0335845947265625, 0.03057861328125, 0.0947418212890625, 0.158905029296875, 0.2230682373046875, 0.2872314453125, 0.3513946533203125, 0.415557861328125, 0.4797210693359375, 0.54388427734375, 0.6080474853515625, 0.672210693359375, 0.7363739013671875, 0.800537109375, 0.8647003173828125, 0.928863525390625, 0.9930267333984375, 1.05718994140625, 1.1213531494140625, 1.185516357421875, 1.2496795654296875, 1.3138427734375, 1.3780059814453125, 1.442169189453125, 1.5063323974609375, 1.57049560546875, 1.6346588134765625, 1.698822021484375, 1.7629852294921875, 1.8271484375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 8.0, 8.0, 12.0, 16.0, 15.0, 19.0, 23.0, 23.0, 29.0, 27.0, 46.0, 46.0, 43.0, 64.0, 55.0, 51.0, 56.0, 76.0, 49.0, 44.0, 48.0, 42.0, 27.0, 38.0, 28.0, 25.0, 19.0, 14.0, 12.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.51318359375, -0.4976463317871094, -0.48210906982421875, -0.4665718078613281, -0.4510345458984375, -0.4354972839355469, -0.41996002197265625, -0.4044227600097656, -0.388885498046875, -0.3733482360839844, -0.35781097412109375, -0.3422737121582031, -0.3267364501953125, -0.3111991882324219, -0.29566192626953125, -0.2801246643066406, -0.26458740234375, -0.24905014038085938, -0.23351287841796875, -0.21797561645507812, -0.2024383544921875, -0.18690109252929688, -0.17136383056640625, -0.15582656860351562, -0.140289306640625, -0.12475204467773438, -0.10921478271484375, -0.09367752075195312, -0.0781402587890625, -0.06260299682617188, -0.04706573486328125, -0.031528472900390625, -0.0159912109375, -0.000453948974609375, 0.01508331298828125, 0.030620574951171875, 0.0461578369140625, 0.061695098876953125, 0.07723236083984375, 0.09276962280273438, 0.108306884765625, 0.12384414672851562, 0.13938140869140625, 0.15491867065429688, 0.1704559326171875, 0.18599319458007812, 0.20153045654296875, 0.21706771850585938, 0.23260498046875, 0.24814224243164062, 0.26367950439453125, 0.2792167663574219, 0.2947540283203125, 0.3102912902832031, 0.32582855224609375, 0.3413658142089844, 0.356903076171875, 0.3724403381347656, 0.38797760009765625, 0.4035148620605469, 0.4190521240234375, 0.4345893859863281, 0.45012664794921875, 0.4656639099121094, 0.481201171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 13.0, 5.0, 12.0, 24.0, 28.0, 46.0, 90.0, 118.0, 246.0, 506.0, 967.0, 2353.0, 7023.0, 28116.0, 137330.0, 737686.0, 2113079.0, 940464.0, 177502.0, 34880.0, 8717.0, 2759.0, 1118.0, 534.0, 284.0, 156.0, 69.0, 57.0, 27.0, 29.0, 21.0, 7.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.421875, -1.3868331909179688, -1.3517913818359375, -1.3167495727539062, -1.281707763671875, -1.2466659545898438, -1.2116241455078125, -1.1765823364257812, -1.14154052734375, -1.1064987182617188, -1.0714569091796875, -1.0364151000976562, -1.001373291015625, -0.9663314819335938, -0.9312896728515625, -0.8962478637695312, -0.8612060546875, -0.8261642456054688, -0.7911224365234375, -0.7560806274414062, -0.721038818359375, -0.6859970092773438, -0.6509552001953125, -0.6159133911132812, -0.58087158203125, -0.5458297729492188, -0.5107879638671875, -0.47574615478515625, -0.440704345703125, -0.40566253662109375, -0.3706207275390625, -0.33557891845703125, -0.300537109375, -0.26549530029296875, -0.2304534912109375, -0.19541168212890625, -0.160369873046875, -0.12532806396484375, -0.0902862548828125, -0.05524444580078125, -0.02020263671875, 0.01483917236328125, 0.0498809814453125, 0.08492279052734375, 0.119964599609375, 0.15500640869140625, 0.1900482177734375, 0.22509002685546875, 0.2601318359375, 0.29517364501953125, 0.3302154541015625, 0.36525726318359375, 0.400299072265625, 0.43534088134765625, 0.4703826904296875, 0.5054244995117188, 0.54046630859375, 0.5755081176757812, 0.6105499267578125, 0.6455917358398438, 0.680633544921875, 0.7156753540039062, 0.7507171630859375, 0.7857589721679688, 0.82080078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 9.0, 8.0, 18.0, 15.0, 38.0, 35.0, 55.0, 73.0, 99.0, 159.0, 198.0, 239.0, 283.0, 332.0, 355.0, 397.0, 359.0, 321.0, 261.0, 228.0, 151.0, 128.0, 81.0, 71.0, 39.0, 28.0, 31.0, 20.0, 18.0, 6.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61962890625, -0.596099853515625, -0.57257080078125, -0.549041748046875, -0.5255126953125, -0.501983642578125, -0.47845458984375, -0.454925537109375, -0.431396484375, -0.407867431640625, -0.38433837890625, -0.360809326171875, -0.3372802734375, -0.313751220703125, -0.29022216796875, -0.266693115234375, -0.2431640625, -0.219635009765625, -0.19610595703125, -0.172576904296875, -0.1490478515625, -0.125518798828125, -0.10198974609375, -0.078460693359375, -0.054931640625, -0.031402587890625, -0.00787353515625, 0.015655517578125, 0.0391845703125, 0.062713623046875, 0.08624267578125, 0.109771728515625, 0.13330078125, 0.156829833984375, 0.18035888671875, 0.203887939453125, 0.2274169921875, 0.250946044921875, 0.27447509765625, 0.298004150390625, 0.321533203125, 0.345062255859375, 0.36859130859375, 0.392120361328125, 0.4156494140625, 0.439178466796875, 0.46270751953125, 0.486236572265625, 0.509765625, 0.533294677734375, 0.55682373046875, 0.580352783203125, 0.6038818359375, 0.627410888671875, 0.65093994140625, 0.674468994140625, 0.697998046875, 0.721527099609375, 0.74505615234375, 0.768585205078125, 0.7921142578125, 0.815643310546875, 0.83917236328125, 0.862701416015625, 0.88623046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 25.0, 49.0, 116.0, 221.0, 258.0, 200.0, 84.0, 34.0, 12.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.779558181762695, -6.461991310119629, -6.1444244384765625, -5.826857566833496, -5.509291172027588, -5.1917243003845215, -4.874157428741455, -4.556591033935547, -4.2390241622924805, -3.921457290649414, -3.6038906574249268, -3.2863237857818604, -2.968757152557373, -2.6511902809143066, -2.3336234092712402, -2.016056776046753, -1.6984896659851074, -1.3809229135513306, -1.0633561611175537, -0.7457892894744873, -0.42822253704071045, -0.1106557846069336, 0.2069110870361328, 0.5244777202606201, 0.8420445919036865, 1.1596113443374634, 1.4771780967712402, 1.7947449684143066, 2.112311840057373, 2.4298784732818604, 2.7474453449249268, 3.065011978149414, 3.3825788497924805, 3.700145721435547, 4.017712593078613, 4.33527946472168, 4.652845859527588, 4.970412731170654, 5.287979602813721, 5.605545997619629, 5.923112869262695, 6.240679740905762, 6.558246612548828, 6.8758134841918945, 7.193379878997803, 7.510946750640869, 7.8285136222839355, 8.146080017089844, 8.463647842407227, 8.781214714050293, 9.09878158569336, 9.416348457336426, 9.733915328979492, 10.051481246948242, 10.369049072265625, 10.686614990234375, 11.004181861877441, 11.321748733520508, 11.639315605163574, 11.95688247680664, 12.274449348449707, 12.592016220092773, 12.909582138061523, 13.22714900970459, 13.544715881347656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 9.0, 12.0, 14.0, 14.0, 18.0, 21.0, 28.0, 28.0, 29.0, 34.0, 41.0, 35.0, 38.0, 65.0, 43.0, 47.0, 52.0, 48.0, 45.0, 47.0, 42.0, 35.0, 25.0, 30.0, 22.0, 29.0, 23.0, 21.0, 15.0, 16.0, 16.0, 6.0, 10.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5316033363342285, -2.4514083862304688, -2.371213436126709, -2.29101824760437, -2.2108232975006104, -2.1306283473968506, -2.050433397293091, -1.9702383279800415, -1.8900432586669922, -1.8098483085632324, -1.729653239250183, -1.6494582891464233, -1.569263219833374, -1.4890682697296143, -1.4088733196258545, -1.3286782503128052, -1.2484833002090454, -1.1682883501052856, -1.0880932807922363, -1.0078983306884766, -0.9277032613754272, -0.8475083112716675, -0.7673133015632629, -0.6871182918548584, -0.6069232821464539, -0.5267282724380493, -0.4465332627296448, -0.3663382828235626, -0.2861432731151581, -0.20594826340675354, -0.1257532835006714, -0.045558273792266846, 0.034636735916137695, 0.11483173817396164, 0.19502674043178558, 0.27522173523902893, 0.35541674494743347, 0.435611754655838, 0.5158067345619202, 0.5960017442703247, 0.6761967539787292, 0.7563917636871338, 0.8365867733955383, 0.9167817831039429, 0.9969767332077026, 1.077171802520752, 1.1573667526245117, 1.2375617027282715, 1.3177567720413208, 1.3979517221450806, 1.4781467914581299, 1.5583417415618896, 1.638536810874939, 1.7187317609786987, 1.798926830291748, 1.8791217803955078, 1.9593167304992676, 2.0395116806030273, 2.119706630706787, 2.199901819229126, 2.2800967693328857, 2.3602917194366455, 2.4404866695404053, 2.520681858062744, 2.600876808166504]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 8.0, 12.0, 15.0, 19.0, 42.0, 58.0, 114.0, 269.0, 558.0, 1111.0, 2569.0, 6361.0, 15645.0, 45621.0, 159862.0, 393199.0, 290149.0, 88282.0, 27079.0, 10097.0, 4143.0, 1754.0, 770.0, 363.0, 160.0, 88.0, 59.0, 34.0, 25.0, 13.0, 13.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7685546875, -1.7110748291015625, -1.653594970703125, -1.5961151123046875, -1.53863525390625, -1.4811553955078125, -1.423675537109375, -1.3661956787109375, -1.3087158203125, -1.2512359619140625, -1.193756103515625, -1.1362762451171875, -1.07879638671875, -1.0213165283203125, -0.963836669921875, -0.9063568115234375, -0.848876953125, -0.7913970947265625, -0.733917236328125, -0.6764373779296875, -0.61895751953125, -0.5614776611328125, -0.503997802734375, -0.4465179443359375, -0.3890380859375, -0.3315582275390625, -0.274078369140625, -0.2165985107421875, -0.15911865234375, -0.1016387939453125, -0.044158935546875, 0.0133209228515625, 0.07080078125, 0.1282806396484375, 0.185760498046875, 0.2432403564453125, 0.30072021484375, 0.3582000732421875, 0.415679931640625, 0.4731597900390625, 0.5306396484375, 0.5881195068359375, 0.645599365234375, 0.7030792236328125, 0.76055908203125, 0.8180389404296875, 0.875518798828125, 0.9329986572265625, 0.990478515625, 1.0479583740234375, 1.105438232421875, 1.1629180908203125, 1.22039794921875, 1.2778778076171875, 1.335357666015625, 1.3928375244140625, 1.4503173828125, 1.5077972412109375, 1.565277099609375, 1.6227569580078125, 1.68023681640625, 1.7377166748046875, 1.795196533203125, 1.8526763916015625, 1.91015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 13.0, 13.0, 19.0, 18.0, 26.0, 38.0, 46.0, 42.0, 56.0, 73.0, 55.0, 68.0, 79.0, 84.0, 75.0, 61.0, 47.0, 42.0, 37.0, 34.0, 20.0, 15.0, 10.0, 10.0, 7.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6917800903320312, -0.6726226806640625, -0.6534652709960938, -0.634307861328125, -0.6151504516601562, -0.5959930419921875, -0.5768356323242188, -0.55767822265625, -0.5385208129882812, -0.5193634033203125, -0.5002059936523438, -0.481048583984375, -0.46189117431640625, -0.4427337646484375, -0.42357635498046875, -0.4044189453125, -0.38526153564453125, -0.3661041259765625, -0.34694671630859375, -0.327789306640625, -0.30863189697265625, -0.2894744873046875, -0.27031707763671875, -0.25115966796875, -0.23200225830078125, -0.2128448486328125, -0.19368743896484375, -0.174530029296875, -0.15537261962890625, -0.1362152099609375, -0.11705780029296875, -0.097900390625, -0.07874298095703125, -0.0595855712890625, -0.04042816162109375, -0.021270751953125, -0.00211334228515625, 0.0170440673828125, 0.03620147705078125, 0.05535888671875, 0.07451629638671875, 0.0936737060546875, 0.11283111572265625, 0.131988525390625, 0.15114593505859375, 0.1703033447265625, 0.18946075439453125, 0.2086181640625, 0.22777557373046875, 0.2469329833984375, 0.26609039306640625, 0.285247802734375, 0.30440521240234375, 0.3235626220703125, 0.34272003173828125, 0.36187744140625, 0.38103485107421875, 0.4001922607421875, 0.41934967041015625, 0.438507080078125, 0.45766448974609375, 0.4768218994140625, 0.49597930908203125, 0.51513671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 10.0, 16.0, 21.0, 24.0, 46.0, 71.0, 98.0, 111.0, 181.0, 277.0, 457.0, 808.0, 1397.0, 2646.0, 4919.0, 9654.0, 19627.0, 39174.0, 80513.0, 149826.0, 219867.0, 218039.0, 146309.0, 77597.0, 37982.0, 18739.0, 9240.0, 4869.0, 2573.0, 1361.0, 746.0, 451.0, 299.0, 188.0, 127.0, 95.0, 54.0, 42.0, 29.0, 26.0, 13.0, 14.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.95654296875, -0.9266281127929688, -0.8967132568359375, -0.8667984008789062, -0.836883544921875, -0.8069686889648438, -0.7770538330078125, -0.7471389770507812, -0.71722412109375, -0.6873092651367188, -0.6573944091796875, -0.6274795532226562, -0.597564697265625, -0.5676498413085938, -0.5377349853515625, -0.5078201293945312, -0.4779052734375, -0.44799041748046875, -0.4180755615234375, -0.38816070556640625, -0.358245849609375, -0.32833099365234375, -0.2984161376953125, -0.26850128173828125, -0.23858642578125, -0.20867156982421875, -0.1787567138671875, -0.14884185791015625, -0.118927001953125, -0.08901214599609375, -0.0590972900390625, -0.02918243408203125, 0.000732421875, 0.03064727783203125, 0.0605621337890625, 0.09047698974609375, 0.120391845703125, 0.15030670166015625, 0.1802215576171875, 0.21013641357421875, 0.24005126953125, 0.26996612548828125, 0.2998809814453125, 0.32979583740234375, 0.359710693359375, 0.38962554931640625, 0.4195404052734375, 0.44945526123046875, 0.4793701171875, 0.5092849731445312, 0.5391998291015625, 0.5691146850585938, 0.599029541015625, 0.6289443969726562, 0.6588592529296875, 0.6887741088867188, 0.71868896484375, 0.7486038208007812, 0.7785186767578125, 0.8084335327148438, 0.838348388671875, 0.8682632446289062, 0.8981781005859375, 0.9280929565429688, 0.9580078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 7.0, 14.0, 14.0, 15.0, 21.0, 27.0, 25.0, 31.0, 36.0, 32.0, 35.0, 49.0, 41.0, 49.0, 50.0, 40.0, 42.0, 32.0, 45.0, 45.0, 41.0, 34.0, 35.0, 42.0, 28.0, 34.0, 16.0, 21.0, 16.0, 16.0, 8.0, 10.0, 4.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1123046875, -1.0794906616210938, -1.0466766357421875, -1.0138626098632812, -0.981048583984375, -0.9482345581054688, -0.9154205322265625, -0.8826065063476562, -0.84979248046875, -0.8169784545898438, -0.7841644287109375, -0.7513504028320312, -0.718536376953125, -0.6857223510742188, -0.6529083251953125, -0.6200942993164062, -0.5872802734375, -0.5544662475585938, -0.5216522216796875, -0.48883819580078125, -0.456024169921875, -0.42321014404296875, -0.3903961181640625, -0.35758209228515625, -0.32476806640625, -0.29195404052734375, -0.2591400146484375, -0.22632598876953125, -0.193511962890625, -0.16069793701171875, -0.1278839111328125, -0.09506988525390625, -0.062255859375, -0.02944183349609375, 0.0033721923828125, 0.03618621826171875, 0.069000244140625, 0.10181427001953125, 0.1346282958984375, 0.16744232177734375, 0.20025634765625, 0.23307037353515625, 0.2658843994140625, 0.29869842529296875, 0.331512451171875, 0.36432647705078125, 0.3971405029296875, 0.42995452880859375, 0.4627685546875, 0.49558258056640625, 0.5283966064453125, 0.5612106323242188, 0.594024658203125, 0.6268386840820312, 0.6596527099609375, 0.6924667358398438, 0.72528076171875, 0.7580947875976562, 0.7909088134765625, 0.8237228393554688, 0.856536865234375, 0.8893508911132812, 0.9221649169921875, 0.9549789428710938, 0.98779296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 13.0, 23.0, 35.0, 55.0, 101.0, 172.0, 339.0, 553.0, 1076.0, 1974.0, 4392.0, 10150.0, 24976.0, 64860.0, 152992.0, 268912.0, 265493.0, 148350.0, 61739.0, 24286.0, 9710.0, 4131.0, 1966.0, 958.0, 529.0, 340.0, 159.0, 135.0, 39.0, 37.0, 17.0, 11.0, 13.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48095703125, -0.46543121337890625, -0.4499053955078125, -0.43437957763671875, -0.418853759765625, -0.40332794189453125, -0.3878021240234375, -0.37227630615234375, -0.35675048828125, -0.34122467041015625, -0.3256988525390625, -0.31017303466796875, -0.294647216796875, -0.27912139892578125, -0.2635955810546875, -0.24806976318359375, -0.2325439453125, -0.21701812744140625, -0.2014923095703125, -0.18596649169921875, -0.170440673828125, -0.15491485595703125, -0.1393890380859375, -0.12386322021484375, -0.10833740234375, -0.09281158447265625, -0.0772857666015625, -0.06175994873046875, -0.046234130859375, -0.03070831298828125, -0.0151824951171875, 0.00034332275390625, 0.015869140625, 0.03139495849609375, 0.0469207763671875, 0.06244659423828125, 0.077972412109375, 0.09349822998046875, 0.1090240478515625, 0.12454986572265625, 0.14007568359375, 0.15560150146484375, 0.1711273193359375, 0.18665313720703125, 0.202178955078125, 0.21770477294921875, 0.2332305908203125, 0.24875640869140625, 0.2642822265625, 0.27980804443359375, 0.2953338623046875, 0.31085968017578125, 0.326385498046875, 0.34191131591796875, 0.3574371337890625, 0.37296295166015625, 0.38848876953125, 0.40401458740234375, 0.4195404052734375, 0.43506622314453125, 0.450592041015625, 0.46611785888671875, 0.4816436767578125, 0.49716949462890625, 0.5126953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 9.0, 10.0, 6.0, 18.0, 13.0, 17.0, 34.0, 33.0, 47.0, 55.0, 49.0, 71.0, 61.0, 76.0, 80.0, 66.0, 65.0, 51.0, 42.0, 45.0, 21.0, 23.0, 18.0, 15.0, 9.0, 15.0, 6.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.381981074810028e-05, -6.153807044029236e-05, -5.9256330132484436e-05, -5.6974589824676514e-05, -5.469284951686859e-05, -5.241110920906067e-05, -5.0129368901252747e-05, -4.7847628593444824e-05, -4.55658882856369e-05, -4.328414797782898e-05, -4.100240767002106e-05, -3.8720667362213135e-05, -3.643892705440521e-05, -3.415718674659729e-05, -3.187544643878937e-05, -2.9593706130981445e-05, -2.7311965823173523e-05, -2.50302255153656e-05, -2.2748485207557678e-05, -2.0466744899749756e-05, -1.8185004591941833e-05, -1.590326428413391e-05, -1.3621523976325989e-05, -1.1339783668518066e-05, -9.058043360710144e-06, -6.776303052902222e-06, -4.494562745094299e-06, -2.212822437286377e-06, 6.891787052154541e-08, 2.3506581783294678e-06, 4.63239848613739e-06, 6.9141387939453125e-06, 9.195879101753235e-06, 1.1477619409561157e-05, 1.375935971736908e-05, 1.6041100025177002e-05, 1.8322840332984924e-05, 2.0604580640792847e-05, 2.288632094860077e-05, 2.516806125640869e-05, 2.7449801564216614e-05, 2.9731541872024536e-05, 3.201328217983246e-05, 3.429502248764038e-05, 3.65767627954483e-05, 3.8858503103256226e-05, 4.114024341106415e-05, 4.342198371887207e-05, 4.570372402667999e-05, 4.7985464334487915e-05, 5.026720464229584e-05, 5.254894495010376e-05, 5.483068525791168e-05, 5.7112425565719604e-05, 5.939416587352753e-05, 6.167590618133545e-05, 6.395764648914337e-05, 6.62393867969513e-05, 6.852112710475922e-05, 7.080286741256714e-05, 7.308460772037506e-05, 7.536634802818298e-05, 7.76480883359909e-05, 7.992982864379883e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 8.0, 13.0, 15.0, 30.0, 47.0, 54.0, 104.0, 172.0, 250.0, 444.0, 843.0, 1565.0, 3311.0, 7474.0, 17089.0, 40477.0, 94874.0, 191147.0, 265943.0, 217833.0, 116078.0, 51725.0, 21600.0, 9322.0, 4061.0, 1832.0, 974.0, 504.0, 307.0, 172.0, 108.0, 58.0, 47.0, 29.0, 20.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.5, -0.4867134094238281, -0.47342681884765625, -0.4601402282714844, -0.4468536376953125, -0.4335670471191406, -0.42028045654296875, -0.4069938659667969, -0.393707275390625, -0.3804206848144531, -0.36713409423828125, -0.3538475036621094, -0.3405609130859375, -0.3272743225097656, -0.31398773193359375, -0.3007011413574219, -0.28741455078125, -0.2741279602050781, -0.26084136962890625, -0.24755477905273438, -0.2342681884765625, -0.22098159790039062, -0.20769500732421875, -0.19440841674804688, -0.181121826171875, -0.16783523559570312, -0.15454864501953125, -0.14126205444335938, -0.1279754638671875, -0.11468887329101562, -0.10140228271484375, -0.08811569213867188, -0.0748291015625, -0.061542510986328125, -0.04825592041015625, -0.034969329833984375, -0.0216827392578125, -0.008396148681640625, 0.00489044189453125, 0.018177032470703125, 0.031463623046875, 0.044750213623046875, 0.05803680419921875, 0.07132339477539062, 0.0846099853515625, 0.09789657592773438, 0.11118316650390625, 0.12446975708007812, 0.13775634765625, 0.15104293823242188, 0.16432952880859375, 0.17761611938476562, 0.1909027099609375, 0.20418930053710938, 0.21747589111328125, 0.23076248168945312, 0.244049072265625, 0.2573356628417969, 0.27062225341796875, 0.2839088439941406, 0.2971954345703125, 0.3104820251464844, 0.32376861572265625, 0.3370552062988281, 0.350341796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 10.0, 10.0, 8.0, 14.0, 13.0, 16.0, 23.0, 24.0, 37.0, 38.0, 41.0, 44.0, 48.0, 61.0, 64.0, 81.0, 56.0, 59.0, 47.0, 38.0, 36.0, 36.0, 25.0, 24.0, 29.0, 21.0, 23.0, 16.0, 15.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3105010986328125, -0.299957275390625, -0.2894134521484375, -0.27886962890625, -0.2683258056640625, -0.257781982421875, -0.2472381591796875, -0.2366943359375, -0.2261505126953125, -0.215606689453125, -0.2050628662109375, -0.19451904296875, -0.1839752197265625, -0.173431396484375, -0.1628875732421875, -0.15234375, -0.1417999267578125, -0.131256103515625, -0.1207122802734375, -0.11016845703125, -0.0996246337890625, -0.089080810546875, -0.0785369873046875, -0.0679931640625, -0.0574493408203125, -0.046905517578125, -0.0363616943359375, -0.02581787109375, -0.0152740478515625, -0.004730224609375, 0.0058135986328125, 0.016357421875, 0.0269012451171875, 0.037445068359375, 0.0479888916015625, 0.05853271484375, 0.0690765380859375, 0.079620361328125, 0.0901641845703125, 0.1007080078125, 0.1112518310546875, 0.121795654296875, 0.1323394775390625, 0.14288330078125, 0.1534271240234375, 0.163970947265625, 0.1745147705078125, 0.18505859375, 0.1956024169921875, 0.206146240234375, 0.2166900634765625, 0.22723388671875, 0.2377777099609375, 0.248321533203125, 0.2588653564453125, 0.2694091796875, 0.2799530029296875, 0.290496826171875, 0.3010406494140625, 0.31158447265625, 0.3221282958984375, 0.332672119140625, 0.3432159423828125, 0.353759765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 11.0, 11.0, 21.0, 32.0, 32.0, 49.0, 45.0, 59.0, 67.0, 80.0, 83.0, 78.0, 69.0, 61.0, 54.0, 45.0, 53.0, 35.0, 25.0, 19.0, 16.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62399959564209, -2.5225133895874023, -2.4210269451141357, -2.3195407390594482, -2.2180545330047607, -2.116568088531494, -2.0150818824768066, -1.9135956764221191, -1.812109351158142, -1.710623025894165, -1.6091368198394775, -1.5076504945755005, -1.4061641693115234, -1.304677963256836, -1.2031916379928589, -1.1017053127288818, -1.0002191066741943, -0.8987328410148621, -0.7972465753555298, -0.6957602500915527, -0.5942739844322205, -0.4927877187728882, -0.39130139350891113, -0.28981512784957886, -0.18832886219024658, -0.08684258162975311, 0.014643698930740356, 0.11612999439239502, 0.2176162600517273, 0.31910252571105957, 0.4205888509750366, 0.5220751166343689, 0.6235613822937012, 0.7250476479530334, 0.8265339136123657, 0.9280202388763428, 1.0295064449310303, 1.1309927701950073, 1.2324790954589844, 1.3339653015136719, 1.435451626777649, 1.536937952041626, 1.6384241580963135, 1.7399104833602905, 1.8413968086242676, 1.942883014678955, 2.0443692207336426, 2.145855665206909, 2.2473418712615967, 2.348828077316284, 2.450314521789551, 2.5518007278442383, 2.653286933898926, 2.7547731399536133, 2.85625958442688, 2.9577457904815674, 3.059232234954834, 3.1607184410095215, 3.262204885482788, 3.3636910915374756, 3.465177297592163, 3.5666637420654297, 3.668149948120117, 3.7696361541748047, 3.871122360229492]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 11.0, 5.0, 12.0, 11.0, 10.0, 19.0, 21.0, 16.0, 31.0, 29.0, 28.0, 47.0, 32.0, 47.0, 36.0, 39.0, 32.0, 37.0, 49.0, 31.0, 46.0, 38.0, 47.0, 42.0, 35.0, 26.0, 22.0, 27.0, 26.0, 29.0, 20.0, 7.0, 12.0, 11.0, 11.0, 9.0, 3.0, 6.0, 7.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.8946542739868164, -2.8066117763519287, -2.718569278717041, -2.6305267810821533, -2.5424842834472656, -2.454441785812378, -2.3663992881774902, -2.2783567905426025, -2.190314292907715, -2.102271795272827, -2.0142292976379395, -1.9261868000030518, -1.838144302368164, -1.7501018047332764, -1.6620593070983887, -1.574016809463501, -1.4859743118286133, -1.3979318141937256, -1.309889316558838, -1.2218468189239502, -1.1338043212890625, -1.0457618236541748, -0.9577193260192871, -0.8696768283843994, -0.7816343307495117, -0.693591833114624, -0.6055493354797363, -0.5175068378448486, -0.42946434020996094, -0.34142184257507324, -0.25337934494018555, -0.16533684730529785, -0.07729458808898926, 0.010747909545898438, 0.09879040718078613, 0.18683290481567383, 0.2748754024505615, 0.3629179000854492, 0.4509603977203369, 0.5390028953552246, 0.6270453929901123, 0.715087890625, 0.8031303882598877, 0.8911728858947754, 0.9792153835296631, 1.0672578811645508, 1.1553003787994385, 1.2433428764343262, 1.3313853740692139, 1.4194278717041016, 1.5074703693389893, 1.595512866973877, 1.6835553646087646, 1.7715978622436523, 1.85964035987854, 1.9476828575134277, 2.0357253551483154, 2.123767852783203, 2.211810350418091, 2.2998528480529785, 2.387895345687866, 2.475937843322754, 2.5639803409576416, 2.6520228385925293, 2.740065336227417]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 13.0, 15.0, 29.0, 19.0, 28.0, 52.0, 76.0, 157.0, 222.0, 408.0, 801.0, 1682.0, 4080.0, 10821.0, 32494.0, 113935.0, 498345.0, 1829978.0, 1307707.0, 286802.0, 71437.0, 21689.0, 7678.0, 3004.0, 1344.0, 655.0, 328.0, 188.0, 104.0, 63.0, 42.0, 23.0, 18.0, 8.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.9017791748046875, -0.877288818359375, -0.8527984619140625, -0.82830810546875, -0.8038177490234375, -0.779327392578125, -0.7548370361328125, -0.7303466796875, -0.7058563232421875, -0.681365966796875, -0.6568756103515625, -0.63238525390625, -0.6078948974609375, -0.583404541015625, -0.5589141845703125, -0.534423828125, -0.5099334716796875, -0.485443115234375, -0.4609527587890625, -0.43646240234375, -0.4119720458984375, -0.387481689453125, -0.3629913330078125, -0.3385009765625, -0.3140106201171875, -0.289520263671875, -0.2650299072265625, -0.24053955078125, -0.2160491943359375, -0.191558837890625, -0.1670684814453125, -0.142578125, -0.1180877685546875, -0.093597412109375, -0.0691070556640625, -0.04461669921875, -0.0201263427734375, 0.004364013671875, 0.0288543701171875, 0.0533447265625, 0.0778350830078125, 0.102325439453125, 0.1268157958984375, 0.15130615234375, 0.1757965087890625, 0.200286865234375, 0.2247772216796875, 0.249267578125, 0.2737579345703125, 0.298248291015625, 0.3227386474609375, 0.34722900390625, 0.3717193603515625, 0.396209716796875, 0.4207000732421875, 0.4451904296875, 0.4696807861328125, 0.494171142578125, 0.5186614990234375, 0.54315185546875, 0.5676422119140625, 0.592132568359375, 0.6166229248046875, 0.64111328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 14.0, 12.0, 24.0, 24.0, 22.0, 26.0, 25.0, 32.0, 49.0, 43.0, 63.0, 67.0, 53.0, 53.0, 56.0, 60.0, 57.0, 48.0, 44.0, 37.0, 39.0, 38.0, 27.0, 16.0, 17.0, 11.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55078125, -0.5349044799804688, -0.5190277099609375, -0.5031509399414062, -0.487274169921875, -0.47139739990234375, -0.4555206298828125, -0.43964385986328125, -0.42376708984375, -0.40789031982421875, -0.3920135498046875, -0.37613677978515625, -0.360260009765625, -0.34438323974609375, -0.3285064697265625, -0.31262969970703125, -0.2967529296875, -0.28087615966796875, -0.2649993896484375, -0.24912261962890625, -0.233245849609375, -0.21736907958984375, -0.2014923095703125, -0.18561553955078125, -0.16973876953125, -0.15386199951171875, -0.1379852294921875, -0.12210845947265625, -0.106231689453125, -0.09035491943359375, -0.0744781494140625, -0.05860137939453125, -0.042724609375, -0.02684783935546875, -0.0109710693359375, 0.00490570068359375, 0.020782470703125, 0.03665924072265625, 0.0525360107421875, 0.06841278076171875, 0.08428955078125, 0.10016632080078125, 0.1160430908203125, 0.13191986083984375, 0.147796630859375, 0.16367340087890625, 0.1795501708984375, 0.19542694091796875, 0.2113037109375, 0.22718048095703125, 0.2430572509765625, 0.25893402099609375, 0.274810791015625, 0.29068756103515625, 0.3065643310546875, 0.32244110107421875, 0.33831787109375, 0.35419464111328125, 0.3700714111328125, 0.38594818115234375, 0.401824951171875, 0.41770172119140625, 0.4335784912109375, 0.44945526123046875, 0.46533203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 11.0, 30.0, 39.0, 68.0, 86.0, 157.0, 322.0, 719.0, 2073.0, 8033.0, 39754.0, 265349.0, 1743912.0, 1802255.0, 277872.0, 41617.0, 8178.0, 2206.0, 803.0, 311.0, 151.0, 100.0, 72.0, 42.0, 33.0, 11.0, 15.0, 6.0, 10.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.291015625, -1.2506866455078125, -1.210357666015625, -1.1700286865234375, -1.12969970703125, -1.0893707275390625, -1.049041748046875, -1.0087127685546875, -0.9683837890625, -0.9280548095703125, -0.887725830078125, -0.8473968505859375, -0.80706787109375, -0.7667388916015625, -0.726409912109375, -0.6860809326171875, -0.645751953125, -0.6054229736328125, -0.565093994140625, -0.5247650146484375, -0.48443603515625, -0.4441070556640625, -0.403778076171875, -0.3634490966796875, -0.3231201171875, -0.2827911376953125, -0.242462158203125, -0.2021331787109375, -0.16180419921875, -0.1214752197265625, -0.081146240234375, -0.0408172607421875, -0.00048828125, 0.0398406982421875, 0.080169677734375, 0.1204986572265625, 0.16082763671875, 0.2011566162109375, 0.241485595703125, 0.2818145751953125, 0.3221435546875, 0.3624725341796875, 0.402801513671875, 0.4431304931640625, 0.48345947265625, 0.5237884521484375, 0.564117431640625, 0.6044464111328125, 0.644775390625, 0.6851043701171875, 0.725433349609375, 0.7657623291015625, 0.80609130859375, 0.8464202880859375, 0.886749267578125, 0.9270782470703125, 0.9674072265625, 1.0077362060546875, 1.048065185546875, 1.0883941650390625, 1.12872314453125, 1.1690521240234375, 1.209381103515625, 1.2497100830078125, 1.2900390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 10.0, 11.0, 9.0, 22.0, 28.0, 44.0, 49.0, 59.0, 86.0, 92.0, 118.0, 148.0, 162.0, 243.0, 300.0, 313.0, 378.0, 335.0, 294.0, 291.0, 263.0, 201.0, 139.0, 114.0, 84.0, 56.0, 52.0, 41.0, 32.0, 19.0, 21.0, 11.0, 11.0, 9.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.673828125, -0.653900146484375, -0.63397216796875, -0.614044189453125, -0.5941162109375, -0.574188232421875, -0.55426025390625, -0.534332275390625, -0.514404296875, -0.494476318359375, -0.47454833984375, -0.454620361328125, -0.4346923828125, -0.414764404296875, -0.39483642578125, -0.374908447265625, -0.35498046875, -0.335052490234375, -0.31512451171875, -0.295196533203125, -0.2752685546875, -0.255340576171875, -0.23541259765625, -0.215484619140625, -0.195556640625, -0.175628662109375, -0.15570068359375, -0.135772705078125, -0.1158447265625, -0.095916748046875, -0.07598876953125, -0.056060791015625, -0.0361328125, -0.016204833984375, 0.00372314453125, 0.023651123046875, 0.0435791015625, 0.063507080078125, 0.08343505859375, 0.103363037109375, 0.123291015625, 0.143218994140625, 0.16314697265625, 0.183074951171875, 0.2030029296875, 0.222930908203125, 0.24285888671875, 0.262786865234375, 0.28271484375, 0.302642822265625, 0.32257080078125, 0.342498779296875, 0.3624267578125, 0.382354736328125, 0.40228271484375, 0.422210693359375, 0.442138671875, 0.462066650390625, 0.48199462890625, 0.501922607421875, 0.5218505859375, 0.541778564453125, 0.56170654296875, 0.581634521484375, 0.6015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 7.0, 18.0, 39.0, 53.0, 70.0, 95.0, 121.0, 137.0, 128.0, 112.0, 100.0, 54.0, 33.0, 23.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6520538330078125, -7.473014831542969, -7.293975830078125, -7.114936828613281, -6.9358978271484375, -6.756858825683594, -6.57781982421875, -6.398780822753906, -6.2197418212890625, -6.040702819824219, -5.861663818359375, -5.682624816894531, -5.5035858154296875, -5.324546813964844, -5.1455078125, -4.966468811035156, -4.7874298095703125, -4.608390808105469, -4.429351806640625, -4.250312805175781, -4.0712738037109375, -3.8922348022460938, -3.71319580078125, -3.5341567993164062, -3.3551173210144043, -3.1760783195495605, -2.997039318084717, -2.818000316619873, -2.6389613151550293, -2.4599223136901855, -2.280883312225342, -2.101844310760498, -1.9228055477142334, -1.7437665462493896, -1.564727544784546, -1.3856885433197021, -1.2066495418548584, -1.0276105403900146, -0.8485714197158813, -0.6695324182510376, -0.49049341678619385, -0.3114544153213501, -0.13241538405418396, 0.04662364721298218, 0.22566264867782593, 0.4047016501426697, 0.5837407112121582, 0.762779712677002, 0.9418187141418457, 1.1208577156066895, 1.2998967170715332, 1.478935718536377, 1.6579747200012207, 1.8370137214660645, 2.016052722930908, 2.195091724395752, 2.3741307258605957, 2.5531697273254395, 2.732208728790283, 2.911247730255127, 3.0902867317199707, 3.2693257331848145, 3.448364734649658, 3.627403736114502, 3.806442975997925]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 6.0, 12.0, 16.0, 18.0, 23.0, 24.0, 25.0, 30.0, 27.0, 38.0, 36.0, 41.0, 28.0, 46.0, 39.0, 41.0, 40.0, 45.0, 34.0, 42.0, 31.0, 35.0, 32.0, 36.0, 36.0, 21.0, 26.0, 23.0, 18.0, 17.0, 19.0, 12.0, 6.0, 13.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.2632663249969482, -2.1969923973083496, -2.130718231201172, -2.0644443035125732, -1.9981701374053955, -1.9318960905075073, -1.8656220436096191, -1.7993481159210205, -1.7330739498138428, -1.6667999029159546, -1.6005258560180664, -1.5342518091201782, -1.46797776222229, -1.4017037153244019, -1.3354296684265137, -1.269155740737915, -1.2028816938400269, -1.1366076469421387, -1.0703336000442505, -1.0040595531463623, -0.9377855062484741, -0.8715114593505859, -0.8052374720573425, -0.7389634251594543, -0.6726893782615662, -0.606415331363678, -0.5401412844657898, -0.473867267370224, -0.4075932204723358, -0.34131917357444763, -0.27504515647888184, -0.20877110958099365, -0.14249706268310547, -0.07622302323579788, -0.009948983788490295, 0.056325048208236694, 0.12259909510612488, 0.18887314200401306, 0.25514715909957886, 0.32142120599746704, 0.3876952528953552, 0.4539692997932434, 0.5202433466911316, 0.586517333984375, 0.6527913808822632, 0.7190654277801514, 0.7853394746780396, 0.8516135215759277, 0.9178875684738159, 0.9841616153717041, 1.0504356622695923, 1.1167097091674805, 1.1829837560653687, 1.2492578029632568, 1.3155317306518555, 1.3818058967590332, 1.4480798244476318, 1.51435387134552, 1.5806279182434082, 1.6469019651412964, 1.7131760120391846, 1.7794500589370728, 1.845724105834961, 1.9119980335235596, 1.9782721996307373]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 14.0, 15.0, 19.0, 34.0, 52.0, 58.0, 101.0, 196.0, 339.0, 708.0, 1502.0, 3284.0, 7733.0, 18639.0, 45149.0, 109971.0, 241080.0, 306035.0, 181803.0, 77164.0, 31631.0, 13074.0, 5351.0, 2353.0, 1028.0, 513.0, 298.0, 146.0, 90.0, 51.0, 33.0, 24.0, 21.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.234375, -1.193634033203125, -1.15289306640625, -1.112152099609375, -1.0714111328125, -1.030670166015625, -0.98992919921875, -0.949188232421875, -0.908447265625, -0.867706298828125, -0.82696533203125, -0.786224365234375, -0.7454833984375, -0.704742431640625, -0.66400146484375, -0.623260498046875, -0.58251953125, -0.541778564453125, -0.50103759765625, -0.460296630859375, -0.4195556640625, -0.378814697265625, -0.33807373046875, -0.297332763671875, -0.256591796875, -0.215850830078125, -0.17510986328125, -0.134368896484375, -0.0936279296875, -0.052886962890625, -0.01214599609375, 0.028594970703125, 0.0693359375, 0.110076904296875, 0.15081787109375, 0.191558837890625, 0.2322998046875, 0.273040771484375, 0.31378173828125, 0.354522705078125, 0.395263671875, 0.436004638671875, 0.47674560546875, 0.517486572265625, 0.5582275390625, 0.598968505859375, 0.63970947265625, 0.680450439453125, 0.72119140625, 0.761932373046875, 0.80267333984375, 0.843414306640625, 0.8841552734375, 0.924896240234375, 0.96563720703125, 1.006378173828125, 1.047119140625, 1.087860107421875, 1.12860107421875, 1.169342041015625, 1.2100830078125, 1.250823974609375, 1.29156494140625, 1.332305908203125, 1.373046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 8.0, 5.0, 13.0, 12.0, 21.0, 21.0, 21.0, 31.0, 40.0, 34.0, 48.0, 47.0, 54.0, 59.0, 64.0, 61.0, 44.0, 62.0, 48.0, 61.0, 43.0, 27.0, 29.0, 30.0, 29.0, 28.0, 15.0, 4.0, 9.0, 8.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5252456665039062, -0.5099639892578125, -0.49468231201171875, -0.479400634765625, -0.46411895751953125, -0.4488372802734375, -0.43355560302734375, -0.41827392578125, -0.40299224853515625, -0.3877105712890625, -0.37242889404296875, -0.357147216796875, -0.34186553955078125, -0.3265838623046875, -0.31130218505859375, -0.2960205078125, -0.28073883056640625, -0.2654571533203125, -0.25017547607421875, -0.234893798828125, -0.21961212158203125, -0.2043304443359375, -0.18904876708984375, -0.17376708984375, -0.15848541259765625, -0.1432037353515625, -0.12792205810546875, -0.112640380859375, -0.09735870361328125, -0.0820770263671875, -0.06679534912109375, -0.051513671875, -0.03623199462890625, -0.0209503173828125, -0.00566864013671875, 0.009613037109375, 0.02489471435546875, 0.0401763916015625, 0.05545806884765625, 0.07073974609375, 0.08602142333984375, 0.1013031005859375, 0.11658477783203125, 0.131866455078125, 0.14714813232421875, 0.1624298095703125, 0.17771148681640625, 0.1929931640625, 0.20827484130859375, 0.2235565185546875, 0.23883819580078125, 0.254119873046875, 0.26940155029296875, 0.2846832275390625, 0.29996490478515625, 0.31524658203125, 0.33052825927734375, 0.3458099365234375, 0.36109161376953125, 0.376373291015625, 0.39165496826171875, 0.4069366455078125, 0.42221832275390625, 0.4375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 10.0, 6.0, 9.0, 7.0, 10.0, 17.0, 22.0, 36.0, 56.0, 112.0, 221.0, 449.0, 1174.0, 2768.0, 6599.0, 15448.0, 35676.0, 79341.0, 163264.0, 258986.0, 237325.0, 135000.0, 63086.0, 28110.0, 11878.0, 5102.0, 2109.0, 883.0, 370.0, 176.0, 95.0, 58.0, 31.0, 22.0, 14.0, 13.0, 13.0, 12.0, 6.0, 6.0, 6.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.162109375, -1.1256256103515625, -1.089141845703125, -1.0526580810546875, -1.01617431640625, -0.9796905517578125, -0.943206787109375, -0.9067230224609375, -0.8702392578125, -0.8337554931640625, -0.797271728515625, -0.7607879638671875, -0.72430419921875, -0.6878204345703125, -0.651336669921875, -0.6148529052734375, -0.578369140625, -0.5418853759765625, -0.505401611328125, -0.4689178466796875, -0.43243408203125, -0.3959503173828125, -0.359466552734375, -0.3229827880859375, -0.2864990234375, -0.2500152587890625, -0.213531494140625, -0.1770477294921875, -0.14056396484375, -0.1040802001953125, -0.067596435546875, -0.0311126708984375, 0.00537109375, 0.0418548583984375, 0.078338623046875, 0.1148223876953125, 0.15130615234375, 0.1877899169921875, 0.224273681640625, 0.2607574462890625, 0.2972412109375, 0.3337249755859375, 0.370208740234375, 0.4066925048828125, 0.44317626953125, 0.4796600341796875, 0.516143798828125, 0.5526275634765625, 0.589111328125, 0.6255950927734375, 0.662078857421875, 0.6985626220703125, 0.73504638671875, 0.7715301513671875, 0.808013916015625, 0.8444976806640625, 0.8809814453125, 0.9174652099609375, 0.953948974609375, 0.9904327392578125, 1.02691650390625, 1.0634002685546875, 1.099884033203125, 1.1363677978515625, 1.1728515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 6.0, 8.0, 10.0, 15.0, 8.0, 11.0, 10.0, 19.0, 21.0, 18.0, 26.0, 23.0, 34.0, 42.0, 33.0, 43.0, 50.0, 36.0, 59.0, 43.0, 43.0, 45.0, 41.0, 33.0, 47.0, 42.0, 34.0, 25.0, 34.0, 17.0, 10.0, 23.0, 16.0, 13.0, 9.0, 9.0, 11.0, 4.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0195770263671875, -0.986419677734375, -0.9532623291015625, -0.92010498046875, -0.8869476318359375, -0.853790283203125, -0.8206329345703125, -0.7874755859375, -0.7543182373046875, -0.721160888671875, -0.6880035400390625, -0.65484619140625, -0.6216888427734375, -0.588531494140625, -0.5553741455078125, -0.522216796875, -0.4890594482421875, -0.455902099609375, -0.4227447509765625, -0.38958740234375, -0.3564300537109375, -0.323272705078125, -0.2901153564453125, -0.2569580078125, -0.2238006591796875, -0.190643310546875, -0.1574859619140625, -0.12432861328125, -0.0911712646484375, -0.058013916015625, -0.0248565673828125, 0.00830078125, 0.0414581298828125, 0.074615478515625, 0.1077728271484375, 0.14093017578125, 0.1740875244140625, 0.207244873046875, 0.2404022216796875, 0.2735595703125, 0.3067169189453125, 0.339874267578125, 0.3730316162109375, 0.40618896484375, 0.4393463134765625, 0.472503662109375, 0.5056610107421875, 0.538818359375, 0.5719757080078125, 0.605133056640625, 0.6382904052734375, 0.67144775390625, 0.7046051025390625, 0.737762451171875, 0.7709197998046875, 0.8040771484375, 0.8372344970703125, 0.870391845703125, 0.9035491943359375, 0.93670654296875, 0.9698638916015625, 1.003021240234375, 1.0361785888671875, 1.0693359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 7.0, 22.0, 48.0, 43.0, 68.0, 109.0, 154.0, 244.0, 373.0, 584.0, 925.0, 1629.0, 2526.0, 4401.0, 7889.0, 14806.0, 27719.0, 50989.0, 88406.0, 136266.0, 174265.0, 177530.0, 142663.0, 94670.0, 55361.0, 30290.0, 15979.0, 8620.0, 4753.0, 2795.0, 1566.0, 999.0, 610.0, 439.0, 285.0, 179.0, 102.0, 77.0, 42.0, 31.0, 16.0, 20.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.309814453125, -0.30072021484375, -0.2916259765625, -0.28253173828125, -0.2734375, -0.26434326171875, -0.2552490234375, -0.24615478515625, -0.237060546875, -0.22796630859375, -0.2188720703125, -0.20977783203125, -0.20068359375, -0.19158935546875, -0.1824951171875, -0.17340087890625, -0.164306640625, -0.15521240234375, -0.1461181640625, -0.13702392578125, -0.1279296875, -0.11883544921875, -0.1097412109375, -0.10064697265625, -0.091552734375, -0.08245849609375, -0.0733642578125, -0.06427001953125, -0.05517578125, -0.04608154296875, -0.0369873046875, -0.02789306640625, -0.018798828125, -0.00970458984375, -0.0006103515625, 0.00848388671875, 0.017578125, 0.02667236328125, 0.0357666015625, 0.04486083984375, 0.053955078125, 0.06304931640625, 0.0721435546875, 0.08123779296875, 0.09033203125, 0.09942626953125, 0.1085205078125, 0.11761474609375, 0.126708984375, 0.13580322265625, 0.1448974609375, 0.15399169921875, 0.1630859375, 0.17218017578125, 0.1812744140625, 0.19036865234375, 0.199462890625, 0.20855712890625, 0.2176513671875, 0.22674560546875, 0.23583984375, 0.24493408203125, 0.2540283203125, 0.26312255859375, 0.272216796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 4.0, 4.0, 9.0, 9.0, 13.0, 18.0, 32.0, 35.0, 43.0, 71.0, 86.0, 101.0, 111.0, 102.0, 94.0, 80.0, 56.0, 48.0, 28.0, 19.0, 9.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012230873107910156, -0.00011885538697242737, -0.00011540204286575317, -0.00011194869875907898, -0.00010849535465240479, -0.00010504201054573059, -0.0001015886664390564, -9.81353223323822e-05, -9.468197822570801e-05, -9.122863411903381e-05, -8.777529001235962e-05, -8.432194590568542e-05, -8.086860179901123e-05, -7.741525769233704e-05, -7.396191358566284e-05, -7.050856947898865e-05, -6.705522537231445e-05, -6.360188126564026e-05, -6.0148537158966064e-05, -5.669519305229187e-05, -5.3241848945617676e-05, -4.978850483894348e-05, -4.633516073226929e-05, -4.288181662559509e-05, -3.94284725189209e-05, -3.5975128412246704e-05, -3.252178430557251e-05, -2.9068440198898315e-05, -2.561509609222412e-05, -2.2161751985549927e-05, -1.8708407878875732e-05, -1.5255063772201538e-05, -1.1801719665527344e-05, -8.34837555885315e-06, -4.895031452178955e-06, -1.4416873455047607e-06, 2.0116567611694336e-06, 5.465000867843628e-06, 8.918344974517822e-06, 1.2371689081192017e-05, 1.582503318786621e-05, 1.9278377294540405e-05, 2.27317214012146e-05, 2.6185065507888794e-05, 2.9638409614562988e-05, 3.309175372123718e-05, 3.654509782791138e-05, 3.999844193458557e-05, 4.3451786041259766e-05, 4.690513014793396e-05, 5.0358474254608154e-05, 5.381181836128235e-05, 5.726516246795654e-05, 6.071850657463074e-05, 6.417185068130493e-05, 6.762519478797913e-05, 7.107853889465332e-05, 7.453188300132751e-05, 7.798522710800171e-05, 8.14385712146759e-05, 8.48919153213501e-05, 8.834525942802429e-05, 9.179860353469849e-05, 9.525194764137268e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 13.0, 30.0, 42.0, 61.0, 113.0, 190.0, 319.0, 559.0, 1112.0, 2150.0, 4234.0, 9079.0, 20924.0, 48609.0, 104120.0, 184211.0, 237816.0, 203582.0, 123799.0, 59578.0, 26027.0, 11378.0, 5060.0, 2563.0, 1329.0, 717.0, 408.0, 207.0, 133.0, 72.0, 35.0, 27.0, 14.0, 10.0, 10.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36669921875, -0.356109619140625, -0.34552001953125, -0.334930419921875, -0.3243408203125, -0.313751220703125, -0.30316162109375, -0.292572021484375, -0.281982421875, -0.271392822265625, -0.26080322265625, -0.250213623046875, -0.2396240234375, -0.229034423828125, -0.21844482421875, -0.207855224609375, -0.197265625, -0.186676025390625, -0.17608642578125, -0.165496826171875, -0.1549072265625, -0.144317626953125, -0.13372802734375, -0.123138427734375, -0.112548828125, -0.101959228515625, -0.09136962890625, -0.080780029296875, -0.0701904296875, -0.059600830078125, -0.04901123046875, -0.038421630859375, -0.02783203125, -0.017242431640625, -0.00665283203125, 0.003936767578125, 0.0145263671875, 0.025115966796875, 0.03570556640625, 0.046295166015625, 0.056884765625, 0.067474365234375, 0.07806396484375, 0.088653564453125, 0.0992431640625, 0.109832763671875, 0.12042236328125, 0.131011962890625, 0.1416015625, 0.152191162109375, 0.16278076171875, 0.173370361328125, 0.1839599609375, 0.194549560546875, 0.20513916015625, 0.215728759765625, 0.226318359375, 0.236907958984375, 0.24749755859375, 0.258087158203125, 0.2686767578125, 0.279266357421875, 0.28985595703125, 0.300445556640625, 0.31103515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 2.0, 5.0, 12.0, 7.0, 16.0, 17.0, 15.0, 26.0, 30.0, 28.0, 39.0, 39.0, 48.0, 45.0, 48.0, 46.0, 63.0, 55.0, 48.0, 65.0, 46.0, 41.0, 35.0, 21.0, 42.0, 29.0, 21.0, 19.0, 28.0, 12.0, 11.0, 11.0, 10.0, 2.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.283935546875, -0.2748870849609375, -0.265838623046875, -0.2567901611328125, -0.24774169921875, -0.2386932373046875, -0.229644775390625, -0.2205963134765625, -0.2115478515625, -0.2024993896484375, -0.193450927734375, -0.1844024658203125, -0.17535400390625, -0.1663055419921875, -0.157257080078125, -0.1482086181640625, -0.13916015625, -0.1301116943359375, -0.121063232421875, -0.1120147705078125, -0.10296630859375, -0.0939178466796875, -0.084869384765625, -0.0758209228515625, -0.0667724609375, -0.0577239990234375, -0.048675537109375, -0.0396270751953125, -0.03057861328125, -0.0215301513671875, -0.012481689453125, -0.0034332275390625, 0.005615234375, 0.0146636962890625, 0.023712158203125, 0.0327606201171875, 0.04180908203125, 0.0508575439453125, 0.059906005859375, 0.0689544677734375, 0.0780029296875, 0.0870513916015625, 0.096099853515625, 0.1051483154296875, 0.11419677734375, 0.1232452392578125, 0.132293701171875, 0.1413421630859375, 0.150390625, 0.1594390869140625, 0.168487548828125, 0.1775360107421875, 0.18658447265625, 0.1956329345703125, 0.204681396484375, 0.2137298583984375, 0.2227783203125, 0.2318267822265625, 0.240875244140625, 0.2499237060546875, 0.25897216796875, 0.2680206298828125, 0.277069091796875, 0.2861175537109375, 0.295166015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 15.0, 16.0, 34.0, 43.0, 63.0, 77.0, 90.0, 89.0, 112.0, 102.0, 100.0, 75.0, 61.0, 44.0, 37.0, 14.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.326821804046631, -7.169806957244873, -7.012792587280273, -6.855777740478516, -6.698762893676758, -6.541748046875, -6.384733200073242, -6.227718830108643, -6.070703983306885, -5.913689136505127, -5.756674766540527, -5.5996599197387695, -5.442645072937012, -5.285630226135254, -5.128615379333496, -4.9716010093688965, -4.814586162567139, -4.657571315765381, -4.500556945800781, -4.343542098999023, -4.186527252197266, -4.029512405395508, -3.872497797012329, -3.7154831886291504, -3.5584683418273926, -3.4014534950256348, -3.244438886642456, -3.0874242782592773, -2.9304094314575195, -2.7733945846557617, -2.616379976272583, -2.4593653678894043, -2.3023500442504883, -2.1453351974487305, -1.9883205890655518, -1.8313058614730835, -1.6742911338806152, -1.517276406288147, -1.3602616786956787, -1.2032469511032104, -1.0462322235107422, -0.8892174959182739, -0.7322027683258057, -0.5751880407333374, -0.41817331314086914, -0.2611585855484009, -0.10414385795593262, 0.052870869636535645, 0.2098855972290039, 0.36690032482147217, 0.5239150524139404, 0.6809297800064087, 0.837944507598877, 0.9949592351913452, 1.1519739627838135, 1.3089886903762817, 1.46600341796875, 1.6230181455612183, 1.7800328731536865, 1.9370476007461548, 2.094062328338623, 2.251077175140381, 2.4080917835235596, 2.5651063919067383, 2.722121238708496]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 5.0, 7.0, 6.0, 9.0, 6.0, 9.0, 12.0, 12.0, 18.0, 23.0, 28.0, 23.0, 27.0, 30.0, 37.0, 38.0, 43.0, 43.0, 34.0, 55.0, 36.0, 36.0, 36.0, 51.0, 36.0, 30.0, 33.0, 35.0, 23.0, 35.0, 29.0, 20.0, 22.0, 33.0, 18.0, 15.0, 10.0, 11.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1466610431671143, -3.0448029041290283, -2.9429447650909424, -2.8410866260528564, -2.7392284870147705, -2.6373703479766846, -2.5355124473571777, -2.433654308319092, -2.331796169281006, -2.22993803024292, -2.128079891204834, -2.026221752166748, -1.924363613128662, -1.8225054740905762, -1.7206474542617798, -1.6187893152236938, -1.5169310569763184, -1.4150729179382324, -1.3132147789001465, -1.2113566398620605, -1.1094985008239746, -1.0076403617858887, -0.9057823419570923, -0.8039242029190063, -0.7020660638809204, -0.6002079248428345, -0.4983498156070709, -0.3964917063713074, -0.29463356733322144, -0.1927754282951355, -0.09091734886169434, 0.010940790176391602, 0.11279916763305664, 0.21465729176998138, 0.31651541590690613, 0.4183735251426697, 0.5202316641807556, 0.6220898032188416, 0.7239478826522827, 0.8258060216903687, 0.9276641607284546, 1.0295222997665405, 1.1313804388046265, 1.2332384586334229, 1.3350965976715088, 1.4369547367095947, 1.5388128757476807, 1.6406710147857666, 1.7425291538238525, 1.8443872928619385, 1.9462454319000244, 2.0481035709381104, 2.1499617099761963, 2.2518198490142822, 2.353677749633789, 2.455535888671875, 2.557394027709961, 2.659252166748047, 2.761110305786133, 2.8629684448242188, 2.9648265838623047, 3.0666847229003906, 3.1685428619384766, 3.2704010009765625, 3.3722591400146484]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 5.0, 9.0, 11.0, 8.0, 24.0, 33.0, 44.0, 69.0, 101.0, 143.0, 217.0, 359.0, 651.0, 1276.0, 2731.0, 5906.0, 14426.0, 39253.0, 128096.0, 534715.0, 1802942.0, 1248449.0, 291359.0, 78021.0, 26456.0, 10344.0, 4314.0, 2084.0, 971.0, 568.0, 272.0, 154.0, 99.0, 53.0, 40.0, 21.0, 14.0, 7.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80078125, -0.7763671875, -0.751953125, -0.7275390625, -0.703125, -0.6787109375, -0.654296875, -0.6298828125, -0.60546875, -0.5810546875, -0.556640625, -0.5322265625, -0.5078125, -0.4833984375, -0.458984375, -0.4345703125, -0.41015625, -0.3857421875, -0.361328125, -0.3369140625, -0.3125, -0.2880859375, -0.263671875, -0.2392578125, -0.21484375, -0.1904296875, -0.166015625, -0.1416015625, -0.1171875, -0.0927734375, -0.068359375, -0.0439453125, -0.01953125, 0.0048828125, 0.029296875, 0.0537109375, 0.078125, 0.1025390625, 0.126953125, 0.1513671875, 0.17578125, 0.2001953125, 0.224609375, 0.2490234375, 0.2734375, 0.2978515625, 0.322265625, 0.3466796875, 0.37109375, 0.3955078125, 0.419921875, 0.4443359375, 0.46875, 0.4931640625, 0.517578125, 0.5419921875, 0.56640625, 0.5908203125, 0.615234375, 0.6396484375, 0.6640625, 0.6884765625, 0.712890625, 0.7373046875, 0.76171875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 11.0, 10.0, 21.0, 19.0, 21.0, 21.0, 40.0, 28.0, 41.0, 36.0, 53.0, 63.0, 72.0, 63.0, 57.0, 54.0, 50.0, 54.0, 47.0, 59.0, 40.0, 25.0, 28.0, 13.0, 11.0, 16.0, 13.0, 8.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5994873046875, -0.582275390625, -0.5650634765625, -0.5478515625, -0.5306396484375, -0.513427734375, -0.4962158203125, -0.47900390625, -0.4617919921875, -0.444580078125, -0.4273681640625, -0.41015625, -0.3929443359375, -0.375732421875, -0.3585205078125, -0.34130859375, -0.3240966796875, -0.306884765625, -0.2896728515625, -0.2724609375, -0.2552490234375, -0.238037109375, -0.2208251953125, -0.20361328125, -0.1864013671875, -0.169189453125, -0.1519775390625, -0.134765625, -0.1175537109375, -0.100341796875, -0.0831298828125, -0.06591796875, -0.0487060546875, -0.031494140625, -0.0142822265625, 0.0029296875, 0.0201416015625, 0.037353515625, 0.0545654296875, 0.07177734375, 0.0889892578125, 0.106201171875, 0.1234130859375, 0.140625, 0.1578369140625, 0.175048828125, 0.1922607421875, 0.20947265625, 0.2266845703125, 0.243896484375, 0.2611083984375, 0.2783203125, 0.2955322265625, 0.312744140625, 0.3299560546875, 0.34716796875, 0.3643798828125, 0.381591796875, 0.3988037109375, 0.416015625, 0.4332275390625, 0.450439453125, 0.4676513671875, 0.48486328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 9.0, 8.0, 13.0, 23.0, 33.0, 48.0, 63.0, 155.0, 263.0, 554.0, 1560.0, 6115.0, 31325.0, 212412.0, 1605767.0, 1994807.0, 289612.0, 40599.0, 7565.0, 1996.0, 666.0, 310.0, 128.0, 92.0, 56.0, 39.0, 15.0, 14.0, 9.0, 11.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3115234375, -1.269317626953125, -1.22711181640625, -1.184906005859375, -1.1427001953125, -1.100494384765625, -1.05828857421875, -1.016082763671875, -0.973876953125, -0.931671142578125, -0.88946533203125, -0.847259521484375, -0.8050537109375, -0.762847900390625, -0.72064208984375, -0.678436279296875, -0.63623046875, -0.594024658203125, -0.55181884765625, -0.509613037109375, -0.4674072265625, -0.425201416015625, -0.38299560546875, -0.340789794921875, -0.298583984375, -0.256378173828125, -0.21417236328125, -0.171966552734375, -0.1297607421875, -0.087554931640625, -0.04534912109375, -0.003143310546875, 0.0390625, 0.081268310546875, 0.12347412109375, 0.165679931640625, 0.2078857421875, 0.250091552734375, 0.29229736328125, 0.334503173828125, 0.376708984375, 0.418914794921875, 0.46112060546875, 0.503326416015625, 0.5455322265625, 0.587738037109375, 0.62994384765625, 0.672149658203125, 0.71435546875, 0.756561279296875, 0.79876708984375, 0.840972900390625, 0.8831787109375, 0.925384521484375, 0.96759033203125, 1.009796142578125, 1.052001953125, 1.094207763671875, 1.13641357421875, 1.178619384765625, 1.2208251953125, 1.263031005859375, 1.30523681640625, 1.347442626953125, 1.3896484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 4.0, 12.0, 14.0, 20.0, 30.0, 37.0, 51.0, 62.0, 95.0, 110.0, 153.0, 212.0, 272.0, 310.0, 328.0, 397.0, 372.0, 299.0, 270.0, 239.0, 188.0, 147.0, 118.0, 92.0, 50.0, 51.0, 41.0, 25.0, 19.0, 12.0, 8.0, 5.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7135467529296875, -0.691741943359375, -0.6699371337890625, -0.64813232421875, -0.6263275146484375, -0.604522705078125, -0.5827178955078125, -0.5609130859375, -0.5391082763671875, -0.517303466796875, -0.4954986572265625, -0.47369384765625, -0.4518890380859375, -0.430084228515625, -0.4082794189453125, -0.386474609375, -0.3646697998046875, -0.342864990234375, -0.3210601806640625, -0.29925537109375, -0.2774505615234375, -0.255645751953125, -0.2338409423828125, -0.2120361328125, -0.1902313232421875, -0.168426513671875, -0.1466217041015625, -0.12481689453125, -0.1030120849609375, -0.081207275390625, -0.0594024658203125, -0.03759765625, -0.0157928466796875, 0.006011962890625, 0.0278167724609375, 0.04962158203125, 0.0714263916015625, 0.093231201171875, 0.1150360107421875, 0.1368408203125, 0.1586456298828125, 0.180450439453125, 0.2022552490234375, 0.22406005859375, 0.2458648681640625, 0.267669677734375, 0.2894744873046875, 0.311279296875, 0.3330841064453125, 0.354888916015625, 0.3766937255859375, 0.39849853515625, 0.4203033447265625, 0.442108154296875, 0.4639129638671875, 0.4857177734375, 0.5075225830078125, 0.529327392578125, 0.5511322021484375, 0.57293701171875, 0.5947418212890625, 0.616546630859375, 0.6383514404296875, 0.66015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 20.0, 36.0, 68.0, 93.0, 128.0, 129.0, 126.0, 133.0, 88.0, 54.0, 55.0, 22.0, 22.0, 11.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.044299125671387, -8.860620498657227, -8.676941871643066, -8.493263244628906, -8.309584617614746, -8.125905990600586, -7.942227363586426, -7.758548736572266, -7.5748701095581055, -7.391191482543945, -7.207512855529785, -7.023834228515625, -6.840155601501465, -6.656476974487305, -6.4727983474731445, -6.289119720458984, -6.105441093444824, -5.921762466430664, -5.738083839416504, -5.554405212402344, -5.370726585388184, -5.187047958374023, -5.003369331359863, -4.819690704345703, -4.636012554168701, -4.452333927154541, -4.268655300140381, -4.084976673126221, -3.9012980461120605, -3.7176194190979004, -3.5339407920837402, -3.35026216506958, -3.16658353805542, -2.9829049110412598, -2.7992262840270996, -2.6155476570129395, -2.4318690299987793, -2.248190402984619, -2.064511775970459, -1.8808332681655884, -1.6971546411514282, -1.513476014137268, -1.329797387123108, -1.1461188793182373, -0.9624401926994324, -0.7787615656852722, -0.5950829982757568, -0.4114043712615967, -0.22772574424743652, -0.04404713213443756, 0.1396314799785614, 0.32331007719039917, 0.5069887042045593, 0.6906673312187195, 0.8743458986282349, 1.058024525642395, 1.2417031526565552, 1.4253817796707153, 1.6090604066848755, 1.792738914489746, 1.9764175415039062, 2.1600961685180664, 2.3437747955322266, 2.5274534225463867, 2.711132049560547]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 5.0, 5.0, 11.0, 10.0, 16.0, 22.0, 17.0, 20.0, 14.0, 15.0, 18.0, 35.0, 27.0, 20.0, 26.0, 37.0, 43.0, 31.0, 43.0, 40.0, 39.0, 44.0, 32.0, 45.0, 37.0, 31.0, 42.0, 35.0, 24.0, 35.0, 20.0, 24.0, 16.0, 18.0, 14.0, 11.0, 19.0, 12.0, 11.0, 5.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.0095295906066895, -1.940954327583313, -1.8723790645599365, -1.8038036823272705, -1.735228419303894, -1.6666531562805176, -1.5980777740478516, -1.529502511024475, -1.4609272480010986, -1.3923519849777222, -1.3237767219543457, -1.2552013397216797, -1.1866260766983032, -1.1180508136749268, -1.0494754314422607, -0.9809001684188843, -0.9123249053955078, -0.8437496423721313, -0.7751743197441101, -0.7065989971160889, -0.6380237340927124, -0.5694484710693359, -0.5008731484413147, -0.43229785561561584, -0.363722562789917, -0.29514726996421814, -0.2265719771385193, -0.15799668431282043, -0.08942139148712158, -0.02084609866142273, 0.04772919416427612, 0.11630448698997498, 0.18487954139709473, 0.2534548342227936, 0.32203012704849243, 0.3906054198741913, 0.45918071269989014, 0.5277559757232666, 0.5963312983512878, 0.6649066209793091, 0.7334818840026855, 0.802057147026062, 0.8706324696540833, 0.9392077922821045, 1.007783055305481, 1.0763583183288574, 1.1449337005615234, 1.2135089635849, 1.2820842266082764, 1.3506594896316528, 1.4192347526550293, 1.4878101348876953, 1.5563853979110718, 1.6249606609344482, 1.6935360431671143, 1.7621113061904907, 1.8306865692138672, 1.8992618322372437, 1.9678370952606201, 2.036412477493286, 2.104987621307373, 2.173563003540039, 2.242138385772705, 2.310713529586792, 2.379288911819458]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 13.0, 15.0, 14.0, 22.0, 31.0, 24.0, 41.0, 77.0, 123.0, 244.0, 471.0, 927.0, 1888.0, 4133.0, 9506.0, 22495.0, 54832.0, 134378.0, 275672.0, 288912.0, 148715.0, 61760.0, 24819.0, 10547.0, 4616.0, 2075.0, 991.0, 513.0, 268.0, 149.0, 87.0, 49.0, 33.0, 24.0, 23.0, 15.0, 14.0, 5.0, 5.0, 5.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0703125, -2.0076904296875, -1.945068359375, -1.8824462890625, -1.81982421875, -1.7572021484375, -1.694580078125, -1.6319580078125, -1.5693359375, -1.5067138671875, -1.444091796875, -1.3814697265625, -1.31884765625, -1.2562255859375, -1.193603515625, -1.1309814453125, -1.068359375, -1.0057373046875, -0.943115234375, -0.8804931640625, -0.81787109375, -0.7552490234375, -0.692626953125, -0.6300048828125, -0.5673828125, -0.5047607421875, -0.442138671875, -0.3795166015625, -0.31689453125, -0.2542724609375, -0.191650390625, -0.1290283203125, -0.06640625, -0.0037841796875, 0.058837890625, 0.1214599609375, 0.18408203125, 0.2467041015625, 0.309326171875, 0.3719482421875, 0.4345703125, 0.4971923828125, 0.559814453125, 0.6224365234375, 0.68505859375, 0.7476806640625, 0.810302734375, 0.8729248046875, 0.935546875, 0.9981689453125, 1.060791015625, 1.1234130859375, 1.18603515625, 1.2486572265625, 1.311279296875, 1.3739013671875, 1.4365234375, 1.4991455078125, 1.561767578125, 1.6243896484375, 1.68701171875, 1.7496337890625, 1.812255859375, 1.8748779296875, 1.9375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 9.0, 12.0, 24.0, 24.0, 36.0, 25.0, 33.0, 32.0, 53.0, 58.0, 66.0, 65.0, 70.0, 63.0, 60.0, 56.0, 57.0, 47.0, 42.0, 42.0, 25.0, 26.0, 16.0, 13.0, 11.0, 7.0, 10.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6041183471679688, -0.5861663818359375, -0.5682144165039062, -0.550262451171875, -0.5323104858398438, -0.5143585205078125, -0.49640655517578125, -0.47845458984375, -0.46050262451171875, -0.4425506591796875, -0.42459869384765625, -0.406646728515625, -0.38869476318359375, -0.3707427978515625, -0.35279083251953125, -0.3348388671875, -0.31688690185546875, -0.2989349365234375, -0.28098297119140625, -0.263031005859375, -0.24507904052734375, -0.2271270751953125, -0.20917510986328125, -0.19122314453125, -0.17327117919921875, -0.1553192138671875, -0.13736724853515625, -0.119415283203125, -0.10146331787109375, -0.0835113525390625, -0.06555938720703125, -0.047607421875, -0.02965545654296875, -0.0117034912109375, 0.00624847412109375, 0.024200439453125, 0.04215240478515625, 0.0601043701171875, 0.07805633544921875, 0.09600830078125, 0.11396026611328125, 0.1319122314453125, 0.14986419677734375, 0.167816162109375, 0.18576812744140625, 0.2037200927734375, 0.22167205810546875, 0.2396240234375, 0.25757598876953125, 0.2755279541015625, 0.29347991943359375, 0.311431884765625, 0.32938385009765625, 0.3473358154296875, 0.36528778076171875, 0.38323974609375, 0.40119171142578125, 0.4191436767578125, 0.43709564208984375, 0.455047607421875, 0.47299957275390625, 0.4909515380859375, 0.5089035034179688, 0.52685546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 1.0, 13.0, 11.0, 18.0, 22.0, 34.0, 36.0, 38.0, 86.0, 101.0, 162.0, 240.0, 446.0, 671.0, 1198.0, 2149.0, 4088.0, 7706.0, 14700.0, 28591.0, 54606.0, 96781.0, 153603.0, 197925.0, 185874.0, 131288.0, 78126.0, 42709.0, 22395.0, 11543.0, 6021.0, 3132.0, 1747.0, 936.0, 602.0, 323.0, 215.0, 133.0, 81.0, 56.0, 37.0, 27.0, 24.0, 18.0, 12.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0629730224609375, -1.027313232421875, -0.9916534423828125, -0.95599365234375, -0.9203338623046875, -0.884674072265625, -0.8490142822265625, -0.8133544921875, -0.7776947021484375, -0.742034912109375, -0.7063751220703125, -0.67071533203125, -0.6350555419921875, -0.599395751953125, -0.5637359619140625, -0.528076171875, -0.4924163818359375, -0.456756591796875, -0.4210968017578125, -0.38543701171875, -0.3497772216796875, -0.314117431640625, -0.2784576416015625, -0.2427978515625, -0.2071380615234375, -0.171478271484375, -0.1358184814453125, -0.10015869140625, -0.0644989013671875, -0.028839111328125, 0.0068206787109375, 0.04248046875, 0.0781402587890625, 0.113800048828125, 0.1494598388671875, 0.18511962890625, 0.2207794189453125, 0.256439208984375, 0.2920989990234375, 0.3277587890625, 0.3634185791015625, 0.399078369140625, 0.4347381591796875, 0.47039794921875, 0.5060577392578125, 0.541717529296875, 0.5773773193359375, 0.613037109375, 0.6486968994140625, 0.684356689453125, 0.7200164794921875, 0.75567626953125, 0.7913360595703125, 0.826995849609375, 0.8626556396484375, 0.8983154296875, 0.9339752197265625, 0.969635009765625, 1.0052947998046875, 1.04095458984375, 1.0766143798828125, 1.112274169921875, 1.1479339599609375, 1.18359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 9.0, 5.0, 7.0, 4.0, 7.0, 8.0, 14.0, 21.0, 31.0, 26.0, 22.0, 33.0, 30.0, 39.0, 28.0, 35.0, 43.0, 39.0, 49.0, 54.0, 49.0, 39.0, 45.0, 38.0, 35.0, 60.0, 30.0, 30.0, 27.0, 15.0, 30.0, 19.0, 20.0, 11.0, 23.0, 10.0, 4.0, 4.0, 5.0, 2.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3857421875, -1.3457794189453125, -1.305816650390625, -1.2658538818359375, -1.22589111328125, -1.1859283447265625, -1.145965576171875, -1.1060028076171875, -1.0660400390625, -1.0260772705078125, -0.986114501953125, -0.9461517333984375, -0.90618896484375, -0.8662261962890625, -0.826263427734375, -0.7863006591796875, -0.746337890625, -0.7063751220703125, -0.666412353515625, -0.6264495849609375, -0.58648681640625, -0.5465240478515625, -0.506561279296875, -0.4665985107421875, -0.4266357421875, -0.3866729736328125, -0.346710205078125, -0.3067474365234375, -0.26678466796875, -0.2268218994140625, -0.186859130859375, -0.1468963623046875, -0.10693359375, -0.0669708251953125, -0.027008056640625, 0.0129547119140625, 0.05291748046875, 0.0928802490234375, 0.132843017578125, 0.1728057861328125, 0.2127685546875, 0.2527313232421875, 0.292694091796875, 0.3326568603515625, 0.37261962890625, 0.4125823974609375, 0.452545166015625, 0.4925079345703125, 0.532470703125, 0.5724334716796875, 0.612396240234375, 0.6523590087890625, 0.69232177734375, 0.7322845458984375, 0.772247314453125, 0.8122100830078125, 0.8521728515625, 0.8921356201171875, 0.932098388671875, 0.9720611572265625, 1.01202392578125, 1.0519866943359375, 1.091949462890625, 1.1319122314453125, 1.171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 11.0, 19.0, 20.0, 32.0, 49.0, 74.0, 113.0, 187.0, 289.0, 457.0, 687.0, 1121.0, 1729.0, 2955.0, 4815.0, 8327.0, 14426.0, 27075.0, 51342.0, 94790.0, 161400.0, 215671.0, 191871.0, 122276.0, 67950.0, 35514.0, 19009.0, 10479.0, 6101.0, 3709.0, 2220.0, 1385.0, 867.0, 542.0, 388.0, 224.0, 159.0, 82.0, 62.0, 42.0, 30.0, 18.0, 12.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.50390625, -0.4885063171386719, -0.47310638427734375, -0.4577064514160156, -0.4423065185546875, -0.4269065856933594, -0.41150665283203125, -0.3961067199707031, -0.380706787109375, -0.3653068542480469, -0.34990692138671875, -0.3345069885253906, -0.3191070556640625, -0.3037071228027344, -0.28830718994140625, -0.2729072570800781, -0.25750732421875, -0.24210739135742188, -0.22670745849609375, -0.21130752563476562, -0.1959075927734375, -0.18050765991210938, -0.16510772705078125, -0.14970779418945312, -0.134307861328125, -0.11890792846679688, -0.10350799560546875, -0.08810806274414062, -0.0727081298828125, -0.057308197021484375, -0.04190826416015625, -0.026508331298828125, -0.0111083984375, 0.004291534423828125, 0.01969146728515625, 0.035091400146484375, 0.0504913330078125, 0.06589126586914062, 0.08129119873046875, 0.09669113159179688, 0.112091064453125, 0.12749099731445312, 0.14289093017578125, 0.15829086303710938, 0.1736907958984375, 0.18909072875976562, 0.20449066162109375, 0.21989059448242188, 0.23529052734375, 0.2506904602050781, 0.26609039306640625, 0.2814903259277344, 0.2968902587890625, 0.3122901916503906, 0.32769012451171875, 0.3430900573730469, 0.358489990234375, 0.3738899230957031, 0.38928985595703125, 0.4046897888183594, 0.4200897216796875, 0.4354896545410156, 0.45088958740234375, 0.4662895202636719, 0.481689453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 16.0, 15.0, 18.0, 30.0, 49.0, 67.0, 90.0, 149.0, 171.0, 138.0, 101.0, 50.0, 35.0, 23.0, 13.0, 11.0, 7.0, 5.0, 9.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022411346435546875, -0.00021554529666900635, -0.00020697712898254395, -0.00019840896129608154, -0.00018984079360961914, -0.00018127262592315674, -0.00017270445823669434, -0.00016413629055023193, -0.00015556812286376953, -0.00014699995517730713, -0.00013843178749084473, -0.00012986361980438232, -0.00012129545211791992, -0.00011272728443145752, -0.00010415911674499512, -9.559094905853271e-05, -8.702278137207031e-05, -7.845461368560791e-05, -6.988644599914551e-05, -6.13182783126831e-05, -5.27501106262207e-05, -4.41819429397583e-05, -3.56137752532959e-05, -2.7045607566833496e-05, -1.8477439880371094e-05, -9.909272193908691e-06, -1.341104507446289e-06, 7.227063179016113e-06, 1.5795230865478516e-05, 2.4363398551940918e-05, 3.293156623840332e-05, 4.149973392486572e-05, 5.0067901611328125e-05, 5.863606929779053e-05, 6.720423698425293e-05, 7.577240467071533e-05, 8.434057235717773e-05, 9.290874004364014e-05, 0.00010147690773010254, 0.00011004507541656494, 0.00011861324310302734, 0.00012718141078948975, 0.00013574957847595215, 0.00014431774616241455, 0.00015288591384887695, 0.00016145408153533936, 0.00017002224922180176, 0.00017859041690826416, 0.00018715858459472656, 0.00019572675228118896, 0.00020429491996765137, 0.00021286308765411377, 0.00022143125534057617, 0.00022999942302703857, 0.00023856759071350098, 0.0002471357583999634, 0.0002557039260864258, 0.0002642720937728882, 0.0002728402614593506, 0.000281408429145813, 0.0002899765968322754, 0.0002985447645187378, 0.0003071129322052002, 0.0003156810998916626, 0.000324249267578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 12.0, 27.0, 37.0, 55.0, 70.0, 151.0, 249.0, 429.0, 814.0, 1276.0, 2360.0, 4484.0, 8927.0, 18729.0, 43721.0, 107511.0, 238961.0, 304476.0, 180875.0, 75499.0, 31195.0, 13969.0, 6849.0, 3458.0, 1860.0, 1095.0, 623.0, 352.0, 202.0, 113.0, 59.0, 35.0, 31.0, 10.0, 10.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6847076416015625, -0.665313720703125, -0.6459197998046875, -0.62652587890625, -0.6071319580078125, -0.587738037109375, -0.5683441162109375, -0.5489501953125, -0.5295562744140625, -0.510162353515625, -0.4907684326171875, -0.47137451171875, -0.4519805908203125, -0.432586669921875, -0.4131927490234375, -0.393798828125, -0.3744049072265625, -0.355010986328125, -0.3356170654296875, -0.31622314453125, -0.2968292236328125, -0.277435302734375, -0.2580413818359375, -0.2386474609375, -0.2192535400390625, -0.199859619140625, -0.1804656982421875, -0.16107177734375, -0.1416778564453125, -0.122283935546875, -0.1028900146484375, -0.08349609375, -0.0641021728515625, -0.044708251953125, -0.0253143310546875, -0.00592041015625, 0.0134735107421875, 0.032867431640625, 0.0522613525390625, 0.0716552734375, 0.0910491943359375, 0.110443115234375, 0.1298370361328125, 0.14923095703125, 0.1686248779296875, 0.188018798828125, 0.2074127197265625, 0.226806640625, 0.2462005615234375, 0.265594482421875, 0.2849884033203125, 0.30438232421875, 0.3237762451171875, 0.343170166015625, 0.3625640869140625, 0.3819580078125, 0.4013519287109375, 0.420745849609375, 0.4401397705078125, 0.45953369140625, 0.4789276123046875, 0.498321533203125, 0.5177154541015625, 0.537109375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 10.0, 12.0, 18.0, 18.0, 31.0, 33.0, 47.0, 53.0, 72.0, 65.0, 72.0, 82.0, 71.0, 68.0, 63.0, 51.0, 39.0, 34.0, 30.0, 22.0, 18.0, 14.0, 15.0, 11.0, 9.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4208183288574219, -0.40438079833984375, -0.3879432678222656, -0.3715057373046875, -0.3550682067871094, -0.33863067626953125, -0.3221931457519531, -0.305755615234375, -0.2893180847167969, -0.27288055419921875, -0.2564430236816406, -0.2400054931640625, -0.22356796264648438, -0.20713043212890625, -0.19069290161132812, -0.17425537109375, -0.15781784057617188, -0.14138031005859375, -0.12494277954101562, -0.1085052490234375, -0.09206771850585938, -0.07563018798828125, -0.059192657470703125, -0.042755126953125, -0.026317596435546875, -0.00988006591796875, 0.006557464599609375, 0.0229949951171875, 0.039432525634765625, 0.05587005615234375, 0.07230758666992188, 0.0887451171875, 0.10518264770507812, 0.12162017822265625, 0.13805770874023438, 0.1544952392578125, 0.17093276977539062, 0.18737030029296875, 0.20380783081054688, 0.220245361328125, 0.23668289184570312, 0.25312042236328125, 0.2695579528808594, 0.2859954833984375, 0.3024330139160156, 0.31887054443359375, 0.3353080749511719, 0.35174560546875, 0.3681831359863281, 0.38462066650390625, 0.4010581970214844, 0.4174957275390625, 0.4339332580566406, 0.45037078857421875, 0.4668083190917969, 0.483245849609375, 0.4996833801269531, 0.5161209106445312, 0.5325584411621094, 0.5489959716796875, 0.5654335021972656, 0.5818710327148438, 0.5983085632324219, 0.61474609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 25.0, 23.0, 34.0, 41.0, 61.0, 71.0, 96.0, 103.0, 99.0, 81.0, 78.0, 60.0, 69.0, 35.0, 39.0, 25.0, 15.0, 14.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17110013961792, -4.97287654876709, -4.774653434753418, -4.576429843902588, -4.378206253051758, -4.179983139038086, -3.981759548187256, -3.783536195755005, -3.585312843322754, -3.387089490890503, -3.188866138458252, -2.990642547607422, -2.792419195175171, -2.59419584274292, -2.39597225189209, -2.197748899459839, -1.999525547027588, -1.801302194595337, -1.6030787229537964, -1.4048552513122559, -1.2066318988800049, -1.008408546447754, -0.8101850748062134, -0.6119616031646729, -0.4137382507324219, -0.21551483869552612, -0.01729142665863037, 0.18093198537826538, 0.37915539741516113, 0.5773788094520569, 0.7756022214889526, 0.9738256931304932, 1.172048568725586, 1.370271921157837, 1.5684953927993774, 1.766718864440918, 1.964942216873169, 2.16316556930542, 2.36138916015625, 2.559612512588501, 2.757835865020752, 2.956059217453003, 3.154282569885254, 3.352506160736084, 3.550729513168335, 3.748952865600586, 3.947176456451416, 4.145400047302246, 4.343623161315918, 4.541846752166748, 4.74006986618042, 4.93829345703125, 5.136516571044922, 5.334740161895752, 5.532963752746582, 5.731186866760254, 5.929410457611084, 6.127634048461914, 6.325857162475586, 6.524080753326416, 6.722304344177246, 6.920527458190918, 7.118751049041748, 7.316974639892578, 7.51519775390625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 1.0, 9.0, 5.0, 10.0, 8.0, 9.0, 20.0, 12.0, 19.0, 26.0, 25.0, 33.0, 28.0, 29.0, 33.0, 26.0, 38.0, 46.0, 38.0, 46.0, 37.0, 43.0, 44.0, 52.0, 42.0, 30.0, 31.0, 28.0, 26.0, 25.0, 25.0, 30.0, 15.0, 16.0, 16.0, 16.0, 12.0, 16.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.271702766418457, -4.145228862762451, -4.018754959106445, -3.8922808170318604, -3.7658066749572754, -3.6393327713012695, -3.5128588676452637, -3.3863847255706787, -3.2599105834960938, -3.133436679840088, -3.006962537765503, -2.880488634109497, -2.754014492034912, -2.6275405883789062, -2.5010666847229004, -2.3745925426483154, -2.2481186389923096, -2.1216447353363037, -1.9951705932617188, -1.868696689605713, -1.742222547531128, -1.615748643875122, -1.4892746210098267, -1.3628005981445312, -1.2363265752792358, -1.1098525524139404, -0.983378529548645, -0.8569045662879944, -0.730430543422699, -0.6039565205574036, -0.47748255729675293, -0.3510085344314575, -0.224534273147583, -0.09806026518344879, 0.028413742780685425, 0.15488773584365845, 0.28136175870895386, 0.40783578157424927, 0.5343097448348999, 0.6607837677001953, 0.7872577905654907, 0.9137318134307861, 1.0402058362960815, 1.166679859161377, 1.2931537628173828, 1.4196279048919678, 1.5461018085479736, 1.672575831413269, 1.7990498542785645, 1.9255238771438599, 2.0519979000091553, 2.178471803665161, 2.304945945739746, 2.431419849395752, 2.557893753051758, 2.6843678951263428, 2.8108420372009277, 2.9373159408569336, 3.0637900829315186, 3.1902639865875244, 3.3167381286621094, 3.4432120323181152, 3.569685935974121, 3.696160078048706, 3.822633981704712]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 10.0, 7.0, 19.0, 19.0, 28.0, 30.0, 49.0, 77.0, 82.0, 156.0, 240.0, 398.0, 743.0, 1205.0, 2241.0, 4496.0, 9446.0, 21464.0, 53085.0, 149097.0, 484720.0, 1398976.0, 1364268.0, 467058.0, 144183.0, 52165.0, 21212.0, 9389.0, 4324.0, 2185.0, 1229.0, 652.0, 374.0, 236.0, 142.0, 98.0, 52.0, 36.0, 28.0, 16.0, 14.0, 8.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80078125, -0.7765045166015625, -0.752227783203125, -0.7279510498046875, -0.70367431640625, -0.6793975830078125, -0.655120849609375, -0.6308441162109375, -0.6065673828125, -0.5822906494140625, -0.558013916015625, -0.5337371826171875, -0.50946044921875, -0.4851837158203125, -0.460906982421875, -0.4366302490234375, -0.412353515625, -0.3880767822265625, -0.363800048828125, -0.3395233154296875, -0.31524658203125, -0.2909698486328125, -0.266693115234375, -0.2424163818359375, -0.2181396484375, -0.1938629150390625, -0.169586181640625, -0.1453094482421875, -0.12103271484375, -0.0967559814453125, -0.072479248046875, -0.0482025146484375, -0.02392578125, 0.0003509521484375, 0.024627685546875, 0.0489044189453125, 0.07318115234375, 0.0974578857421875, 0.121734619140625, 0.1460113525390625, 0.1702880859375, 0.1945648193359375, 0.218841552734375, 0.2431182861328125, 0.26739501953125, 0.2916717529296875, 0.315948486328125, 0.3402252197265625, 0.364501953125, 0.3887786865234375, 0.413055419921875, 0.4373321533203125, 0.46160888671875, 0.4858856201171875, 0.510162353515625, 0.5344390869140625, 0.5587158203125, 0.5829925537109375, 0.607269287109375, 0.6315460205078125, 0.65582275390625, 0.6800994873046875, 0.704376220703125, 0.7286529541015625, 0.7529296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 13.0, 11.0, 9.0, 6.0, 11.0, 18.0, 14.0, 28.0, 24.0, 23.0, 32.0, 36.0, 35.0, 33.0, 45.0, 42.0, 48.0, 51.0, 32.0, 34.0, 37.0, 33.0, 32.0, 41.0, 41.0, 50.0, 38.0, 30.0, 28.0, 16.0, 20.0, 17.0, 14.0, 11.0, 6.0, 9.0, 9.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5141258239746094, -0.49846649169921875, -0.4828071594238281, -0.4671478271484375, -0.4514884948730469, -0.43582916259765625, -0.4201698303222656, -0.404510498046875, -0.3888511657714844, -0.37319183349609375, -0.3575325012207031, -0.3418731689453125, -0.3262138366699219, -0.31055450439453125, -0.2948951721191406, -0.27923583984375, -0.2635765075683594, -0.24791717529296875, -0.23225784301757812, -0.2165985107421875, -0.20093917846679688, -0.18527984619140625, -0.16962051391601562, -0.153961181640625, -0.13830184936523438, -0.12264251708984375, -0.10698318481445312, -0.0913238525390625, -0.07566452026367188, -0.06000518798828125, -0.044345855712890625, -0.0286865234375, -0.013027191162109375, 0.00263214111328125, 0.018291473388671875, 0.0339508056640625, 0.049610137939453125, 0.06526947021484375, 0.08092880249023438, 0.096588134765625, 0.11224746704101562, 0.12790679931640625, 0.14356613159179688, 0.1592254638671875, 0.17488479614257812, 0.19054412841796875, 0.20620346069335938, 0.22186279296875, 0.23752212524414062, 0.25318145751953125, 0.2688407897949219, 0.2845001220703125, 0.3001594543457031, 0.31581878662109375, 0.3314781188964844, 0.347137451171875, 0.3627967834472656, 0.37845611572265625, 0.3941154479980469, 0.4097747802734375, 0.4254341125488281, 0.44109344482421875, 0.4567527770996094, 0.472412109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 9.0, 14.0, 16.0, 37.0, 40.0, 81.0, 139.0, 253.0, 573.0, 1205.0, 2704.0, 6994.0, 19700.0, 69792.0, 301988.0, 1360706.0, 1821736.0, 463378.0, 102082.0, 27342.0, 9100.0, 3500.0, 1468.0, 673.0, 327.0, 168.0, 90.0, 58.0, 44.0, 22.0, 18.0, 10.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.328277587890625, -1.28936767578125, -1.250457763671875, -1.2115478515625, -1.172637939453125, -1.13372802734375, -1.094818115234375, -1.055908203125, -1.016998291015625, -0.97808837890625, -0.939178466796875, -0.9002685546875, -0.861358642578125, -0.82244873046875, -0.783538818359375, -0.74462890625, -0.705718994140625, -0.66680908203125, -0.627899169921875, -0.5889892578125, -0.550079345703125, -0.51116943359375, -0.472259521484375, -0.433349609375, -0.394439697265625, -0.35552978515625, -0.316619873046875, -0.2777099609375, -0.238800048828125, -0.19989013671875, -0.160980224609375, -0.1220703125, -0.083160400390625, -0.04425048828125, -0.005340576171875, 0.0335693359375, 0.072479248046875, 0.11138916015625, 0.150299072265625, 0.189208984375, 0.228118896484375, 0.26702880859375, 0.305938720703125, 0.3448486328125, 0.383758544921875, 0.42266845703125, 0.461578369140625, 0.50048828125, 0.539398193359375, 0.57830810546875, 0.617218017578125, 0.6561279296875, 0.695037841796875, 0.73394775390625, 0.772857666015625, 0.811767578125, 0.850677490234375, 0.88958740234375, 0.928497314453125, 0.9674072265625, 1.006317138671875, 1.04522705078125, 1.084136962890625, 1.123046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 6.0, 6.0, 7.0, 25.0, 30.0, 39.0, 55.0, 72.0, 106.0, 154.0, 181.0, 236.0, 341.0, 386.0, 441.0, 434.0, 397.0, 297.0, 222.0, 172.0, 147.0, 85.0, 53.0, 47.0, 38.0, 23.0, 20.0, 13.0, 9.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8935546875, -0.8614654541015625, -0.829376220703125, -0.7972869873046875, -0.76519775390625, -0.7331085205078125, -0.701019287109375, -0.6689300537109375, -0.6368408203125, -0.6047515869140625, -0.572662353515625, -0.5405731201171875, -0.50848388671875, -0.4763946533203125, -0.444305419921875, -0.4122161865234375, -0.380126953125, -0.3480377197265625, -0.315948486328125, -0.2838592529296875, -0.25177001953125, -0.2196807861328125, -0.187591552734375, -0.1555023193359375, -0.1234130859375, -0.0913238525390625, -0.059234619140625, -0.0271453857421875, 0.00494384765625, 0.0370330810546875, 0.069122314453125, 0.1012115478515625, 0.13330078125, 0.1653900146484375, 0.197479248046875, 0.2295684814453125, 0.26165771484375, 0.2937469482421875, 0.325836181640625, 0.3579254150390625, 0.3900146484375, 0.4221038818359375, 0.454193115234375, 0.4862823486328125, 0.51837158203125, 0.5504608154296875, 0.582550048828125, 0.6146392822265625, 0.646728515625, 0.6788177490234375, 0.710906982421875, 0.7429962158203125, 0.77508544921875, 0.8071746826171875, 0.839263916015625, 0.8713531494140625, 0.9034423828125, 0.9355316162109375, 0.967620849609375, 0.9997100830078125, 1.03179931640625, 1.0638885498046875, 1.095977783203125, 1.1280670166015625, 1.16015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 17.0, 21.0, 45.0, 61.0, 92.0, 134.0, 149.0, 125.0, 122.0, 93.0, 68.0, 29.0, 16.0, 14.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.489984512329102, -10.234557151794434, -9.979129791259766, -9.723702430725098, -9.46827507019043, -9.212847709655762, -8.957420349121094, -8.701992988586426, -8.446565628051758, -8.19113826751709, -7.935710906982422, -7.680283546447754, -7.424856185913086, -7.169428825378418, -6.91400146484375, -6.658574104309082, -6.403146743774414, -6.147719383239746, -5.892292022705078, -5.63686466217041, -5.381437301635742, -5.126009941101074, -4.870582580566406, -4.615155220031738, -4.35972785949707, -4.104300498962402, -3.8488731384277344, -3.5934457778930664, -3.3380184173583984, -3.0825910568237305, -2.8271636962890625, -2.5717363357543945, -2.3163089752197266, -2.0608816146850586, -1.8054542541503906, -1.5500268936157227, -1.2945995330810547, -1.0391721725463867, -0.7837448120117188, -0.5283174514770508, -0.2728900909423828, -0.017462730407714844, 0.23796463012695312, 0.4933919906616211, 0.7488193511962891, 1.004246711730957, 1.259674072265625, 1.515101432800293, 1.770528793334961, 2.025956153869629, 2.281383514404297, 2.536810874938965, 2.792238235473633, 3.047665596008301, 3.3030929565429688, 3.5585203170776367, 3.8139476776123047, 4.069375038146973, 4.324802398681641, 4.580229759216309, 4.835657119750977, 5.0910844802856445, 5.3465118408203125, 5.6019392013549805, 5.857366561889648]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 6.0, 10.0, 10.0, 11.0, 10.0, 14.0, 19.0, 20.0, 29.0, 17.0, 27.0, 35.0, 33.0, 42.0, 40.0, 44.0, 36.0, 28.0, 39.0, 42.0, 44.0, 44.0, 42.0, 33.0, 32.0, 31.0, 27.0, 32.0, 22.0, 25.0, 22.0, 20.0, 15.0, 15.0, 12.0, 14.0, 7.0, 17.0, 1.0, 6.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8077805042266846, -2.7121710777282715, -2.6165616512298584, -2.5209522247314453, -2.4253427982330322, -2.329733371734619, -2.234124183654785, -2.138514518737793, -2.042905330657959, -1.947295904159546, -1.8516864776611328, -1.7560770511627197, -1.6604676246643066, -1.5648581981658936, -1.46924889087677, -1.373639464378357, -1.2780299186706543, -1.1824204921722412, -1.0868110656738281, -0.9912016987800598, -0.8955922722816467, -0.7999828457832336, -0.7043734788894653, -0.6087640523910522, -0.5131546258926392, -0.4175451993942261, -0.3219358026981354, -0.22632640600204468, -0.1307169795036316, -0.035107553005218506, 0.060501813888549805, 0.1561112403869629, 0.2517204284667969, 0.34732985496520996, 0.44293925166130066, 0.5385486483573914, 0.6341580748558044, 0.7297675013542175, 0.8253768682479858, 0.9209862947463989, 1.016595721244812, 1.112205147743225, 1.2078145742416382, 1.3034238815307617, 1.3990333080291748, 1.494642734527588, 1.590252161026001, 1.685861587524414, 1.7814710140228271, 1.8770804405212402, 1.9726898670196533, 2.0682992935180664, 2.1639087200164795, 2.2595181465148926, 2.3551273345947266, 2.4507369995117188, 2.5463461875915527, 2.641955614089966, 2.737565040588379, 2.833174467086792, 2.928783893585205, 3.024393320083618, 3.1200027465820312, 3.2156119346618652, 3.3112215995788574]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 10.0, 11.0, 18.0, 23.0, 33.0, 42.0, 91.0, 141.0, 208.0, 346.0, 608.0, 1115.0, 2034.0, 3746.0, 7032.0, 13489.0, 25649.0, 51137.0, 113790.0, 236496.0, 283107.0, 163006.0, 72681.0, 35076.0, 18059.0, 9497.0, 4996.0, 2727.0, 1447.0, 791.0, 417.0, 278.0, 158.0, 85.0, 62.0, 38.0, 24.0, 23.0, 15.0, 14.0, 5.0, 8.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.5458984375, -1.500732421875, -1.45556640625, -1.410400390625, -1.365234375, -1.320068359375, -1.27490234375, -1.229736328125, -1.1845703125, -1.139404296875, -1.09423828125, -1.049072265625, -1.00390625, -0.958740234375, -0.91357421875, -0.868408203125, -0.8232421875, -0.778076171875, -0.73291015625, -0.687744140625, -0.642578125, -0.597412109375, -0.55224609375, -0.507080078125, -0.4619140625, -0.416748046875, -0.37158203125, -0.326416015625, -0.28125, -0.236083984375, -0.19091796875, -0.145751953125, -0.1005859375, -0.055419921875, -0.01025390625, 0.034912109375, 0.080078125, 0.125244140625, 0.17041015625, 0.215576171875, 0.2607421875, 0.305908203125, 0.35107421875, 0.396240234375, 0.44140625, 0.486572265625, 0.53173828125, 0.576904296875, 0.6220703125, 0.667236328125, 0.71240234375, 0.757568359375, 0.802734375, 0.847900390625, 0.89306640625, 0.938232421875, 0.9833984375, 1.028564453125, 1.07373046875, 1.118896484375, 1.1640625, 1.209228515625, 1.25439453125, 1.299560546875, 1.3447265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 8.0, 18.0, 20.0, 18.0, 21.0, 28.0, 35.0, 34.0, 40.0, 34.0, 37.0, 43.0, 42.0, 48.0, 46.0, 51.0, 52.0, 47.0, 56.0, 41.0, 45.0, 32.0, 30.0, 24.0, 17.0, 25.0, 17.0, 13.0, 14.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.58349609375, -0.5666732788085938, -0.5498504638671875, -0.5330276489257812, -0.516204833984375, -0.49938201904296875, -0.4825592041015625, -0.46573638916015625, -0.44891357421875, -0.43209075927734375, -0.4152679443359375, -0.39844512939453125, -0.381622314453125, -0.36479949951171875, -0.3479766845703125, -0.33115386962890625, -0.3143310546875, -0.29750823974609375, -0.2806854248046875, -0.26386260986328125, -0.247039794921875, -0.23021697998046875, -0.2133941650390625, -0.19657135009765625, -0.17974853515625, -0.16292572021484375, -0.1461029052734375, -0.12928009033203125, -0.112457275390625, -0.09563446044921875, -0.0788116455078125, -0.06198883056640625, -0.045166015625, -0.02834320068359375, -0.0115203857421875, 0.00530242919921875, 0.022125244140625, 0.03894805908203125, 0.0557708740234375, 0.07259368896484375, 0.08941650390625, 0.10623931884765625, 0.1230621337890625, 0.13988494873046875, 0.156707763671875, 0.17353057861328125, 0.1903533935546875, 0.20717620849609375, 0.2239990234375, 0.24082183837890625, 0.2576446533203125, 0.27446746826171875, 0.291290283203125, 0.30811309814453125, 0.3249359130859375, 0.34175872802734375, 0.35858154296875, 0.37540435791015625, 0.3922271728515625, 0.40904998779296875, 0.425872802734375, 0.44269561767578125, 0.4595184326171875, 0.47634124755859375, 0.4931640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 16.0, 20.0, 15.0, 20.0, 32.0, 43.0, 58.0, 78.0, 117.0, 196.0, 305.0, 638.0, 1374.0, 3460.0, 8837.0, 23181.0, 61522.0, 172430.0, 367349.0, 259109.0, 93295.0, 34109.0, 13321.0, 5068.0, 1993.0, 863.0, 457.0, 221.0, 115.0, 93.0, 62.0, 39.0, 40.0, 19.0, 17.0, 16.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.861328125, -1.8061065673828125, -1.750885009765625, -1.6956634521484375, -1.64044189453125, -1.5852203369140625, -1.529998779296875, -1.4747772216796875, -1.4195556640625, -1.3643341064453125, -1.309112548828125, -1.2538909912109375, -1.19866943359375, -1.1434478759765625, -1.088226318359375, -1.0330047607421875, -0.977783203125, -0.9225616455078125, -0.867340087890625, -0.8121185302734375, -0.75689697265625, -0.7016754150390625, -0.646453857421875, -0.5912322998046875, -0.5360107421875, -0.4807891845703125, -0.425567626953125, -0.3703460693359375, -0.31512451171875, -0.2599029541015625, -0.204681396484375, -0.1494598388671875, -0.09423828125, -0.0390167236328125, 0.016204833984375, 0.0714263916015625, 0.12664794921875, 0.1818695068359375, 0.237091064453125, 0.2923126220703125, 0.3475341796875, 0.4027557373046875, 0.457977294921875, 0.5131988525390625, 0.56842041015625, 0.6236419677734375, 0.678863525390625, 0.7340850830078125, 0.789306640625, 0.8445281982421875, 0.899749755859375, 0.9549713134765625, 1.01019287109375, 1.0654144287109375, 1.120635986328125, 1.1758575439453125, 1.2310791015625, 1.2863006591796875, 1.341522216796875, 1.3967437744140625, 1.45196533203125, 1.5071868896484375, 1.562408447265625, 1.6176300048828125, 1.6728515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 13.0, 13.0, 11.0, 10.0, 15.0, 13.0, 20.0, 26.0, 19.0, 32.0, 29.0, 34.0, 37.0, 41.0, 49.0, 30.0, 34.0, 47.0, 32.0, 42.0, 34.0, 36.0, 28.0, 31.0, 32.0, 30.0, 27.0, 23.0, 16.0, 30.0, 17.0, 14.0, 18.0, 22.0, 21.0, 10.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2412109375, -1.201324462890625, -1.16143798828125, -1.121551513671875, -1.0816650390625, -1.041778564453125, -1.00189208984375, -0.962005615234375, -0.922119140625, -0.882232666015625, -0.84234619140625, -0.802459716796875, -0.7625732421875, -0.722686767578125, -0.68280029296875, -0.642913818359375, -0.60302734375, -0.563140869140625, -0.52325439453125, -0.483367919921875, -0.4434814453125, -0.403594970703125, -0.36370849609375, -0.323822021484375, -0.283935546875, -0.244049072265625, -0.20416259765625, -0.164276123046875, -0.1243896484375, -0.084503173828125, -0.04461669921875, -0.004730224609375, 0.03515625, 0.075042724609375, 0.11492919921875, 0.154815673828125, 0.1947021484375, 0.234588623046875, 0.27447509765625, 0.314361572265625, 0.354248046875, 0.394134521484375, 0.43402099609375, 0.473907470703125, 0.5137939453125, 0.553680419921875, 0.59356689453125, 0.633453369140625, 0.67333984375, 0.713226318359375, 0.75311279296875, 0.792999267578125, 0.8328857421875, 0.872772216796875, 0.91265869140625, 0.952545166015625, 0.992431640625, 1.032318115234375, 1.07220458984375, 1.112091064453125, 1.1519775390625, 1.191864013671875, 1.23175048828125, 1.271636962890625, 1.3115234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 20.0, 26.0, 54.0, 91.0, 144.0, 234.0, 324.0, 652.0, 1144.0, 2059.0, 3763.0, 6780.0, 12031.0, 20953.0, 37554.0, 68929.0, 123811.0, 194560.0, 215353.0, 156962.0, 90643.0, 49561.0, 27591.0, 15379.0, 8675.0, 4885.0, 2629.0, 1579.0, 916.0, 477.0, 305.0, 174.0, 94.0, 70.0, 30.0, 30.0, 15.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.576171875, -0.5602684020996094, -0.5443649291992188, -0.5284614562988281, -0.5125579833984375, -0.4966545104980469, -0.48075103759765625, -0.4648475646972656, -0.448944091796875, -0.4330406188964844, -0.41713714599609375, -0.4012336730957031, -0.3853302001953125, -0.3694267272949219, -0.35352325439453125, -0.3376197814941406, -0.32171630859375, -0.3058128356933594, -0.28990936279296875, -0.2740058898925781, -0.2581024169921875, -0.24219894409179688, -0.22629547119140625, -0.21039199829101562, -0.194488525390625, -0.17858505249023438, -0.16268157958984375, -0.14677810668945312, -0.1308746337890625, -0.11497116088867188, -0.09906768798828125, -0.08316421508789062, -0.0672607421875, -0.051357269287109375, -0.03545379638671875, -0.019550323486328125, -0.0036468505859375, 0.012256622314453125, 0.02816009521484375, 0.044063568115234375, 0.059967041015625, 0.07587051391601562, 0.09177398681640625, 0.10767745971679688, 0.1235809326171875, 0.13948440551757812, 0.15538787841796875, 0.17129135131835938, 0.18719482421875, 0.20309829711914062, 0.21900177001953125, 0.23490524291992188, 0.2508087158203125, 0.2667121887207031, 0.28261566162109375, 0.2985191345214844, 0.314422607421875, 0.3303260803222656, 0.34622955322265625, 0.3621330261230469, 0.3780364990234375, 0.3939399719238281, 0.40984344482421875, 0.4257469177246094, 0.441650390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 13.0, 13.0, 22.0, 24.0, 23.0, 51.0, 58.0, 66.0, 94.0, 118.0, 107.0, 97.0, 71.0, 49.0, 50.0, 29.0, 23.0, 13.0, 13.0, 9.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020575523376464844, -0.00020033493638038635, -0.00019491463899612427, -0.00018949434161186218, -0.0001840740442276001, -0.000178653746843338, -0.00017323344945907593, -0.00016781315207481384, -0.00016239285469055176, -0.00015697255730628967, -0.0001515522599220276, -0.0001461319625377655, -0.00014071166515350342, -0.00013529136776924133, -0.00012987107038497925, -0.00012445077300071716, -0.00011903047561645508, -0.00011361017823219299, -0.00010818988084793091, -0.00010276958346366882, -9.734928607940674e-05, -9.192898869514465e-05, -8.650869131088257e-05, -8.108839392662048e-05, -7.56680965423584e-05, -7.024779915809631e-05, -6.482750177383423e-05, -5.9407204389572144e-05, -5.398690700531006e-05, -4.8566609621047974e-05, -4.314631223678589e-05, -3.7726014852523804e-05, -3.230571746826172e-05, -2.6885420083999634e-05, -2.146512269973755e-05, -1.6044825315475464e-05, -1.0624527931213379e-05, -5.204230546951294e-06, 2.1606683731079102e-07, 5.636364221572876e-06, 1.1056661605834961e-05, 1.6476958990097046e-05, 2.189725637435913e-05, 2.7317553758621216e-05, 3.27378511428833e-05, 3.8158148527145386e-05, 4.357844591140747e-05, 4.8998743295669556e-05, 5.441904067993164e-05, 5.9839338064193726e-05, 6.525963544845581e-05, 7.06799328327179e-05, 7.610023021697998e-05, 8.152052760124207e-05, 8.694082498550415e-05, 9.236112236976624e-05, 9.778141975402832e-05, 0.0001032017171382904, 0.00010862201452255249, 0.00011404231190681458, 0.00011946260929107666, 0.00012488290667533875, 0.00013030320405960083, 0.00013572350144386292, 0.000141143798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 7.0, 15.0, 14.0, 28.0, 35.0, 56.0, 87.0, 132.0, 225.0, 352.0, 604.0, 1182.0, 2200.0, 4424.0, 8847.0, 17532.0, 35444.0, 73051.0, 160325.0, 280863.0, 238636.0, 116816.0, 54140.0, 26704.0, 13201.0, 6550.0, 3390.0, 1604.0, 873.0, 478.0, 274.0, 165.0, 107.0, 78.0, 37.0, 25.0, 15.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5432891845703125, -0.525054931640625, -0.5068206787109375, -0.48858642578125, -0.4703521728515625, -0.452117919921875, -0.4338836669921875, -0.4156494140625, -0.3974151611328125, -0.379180908203125, -0.3609466552734375, -0.34271240234375, -0.3244781494140625, -0.306243896484375, -0.2880096435546875, -0.269775390625, -0.2515411376953125, -0.233306884765625, -0.2150726318359375, -0.19683837890625, -0.1786041259765625, -0.160369873046875, -0.1421356201171875, -0.1239013671875, -0.1056671142578125, -0.087432861328125, -0.0691986083984375, -0.05096435546875, -0.0327301025390625, -0.014495849609375, 0.0037384033203125, 0.02197265625, 0.0402069091796875, 0.058441162109375, 0.0766754150390625, 0.09490966796875, 0.1131439208984375, 0.131378173828125, 0.1496124267578125, 0.1678466796875, 0.1860809326171875, 0.204315185546875, 0.2225494384765625, 0.24078369140625, 0.2590179443359375, 0.277252197265625, 0.2954864501953125, 0.313720703125, 0.3319549560546875, 0.350189208984375, 0.3684234619140625, 0.38665771484375, 0.4048919677734375, 0.423126220703125, 0.4413604736328125, 0.4595947265625, 0.4778289794921875, 0.496063232421875, 0.5142974853515625, 0.53253173828125, 0.5507659912109375, 0.569000244140625, 0.5872344970703125, 0.60546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 5.0, 11.0, 17.0, 21.0, 26.0, 28.0, 32.0, 47.0, 38.0, 53.0, 80.0, 65.0, 71.0, 77.0, 81.0, 42.0, 59.0, 43.0, 36.0, 37.0, 26.0, 17.0, 19.0, 12.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.61083984375, -0.5916900634765625, -0.572540283203125, -0.5533905029296875, -0.53424072265625, -0.5150909423828125, -0.495941162109375, -0.4767913818359375, -0.4576416015625, -0.4384918212890625, -0.419342041015625, -0.4001922607421875, -0.38104248046875, -0.3618927001953125, -0.342742919921875, -0.3235931396484375, -0.304443359375, -0.2852935791015625, -0.266143798828125, -0.2469940185546875, -0.22784423828125, -0.2086944580078125, -0.189544677734375, -0.1703948974609375, -0.1512451171875, -0.1320953369140625, -0.112945556640625, -0.0937957763671875, -0.07464599609375, -0.0554962158203125, -0.036346435546875, -0.0171966552734375, 0.001953125, 0.0211029052734375, 0.040252685546875, 0.0594024658203125, 0.07855224609375, 0.0977020263671875, 0.116851806640625, 0.1360015869140625, 0.1551513671875, 0.1743011474609375, 0.193450927734375, 0.2126007080078125, 0.23175048828125, 0.2509002685546875, 0.270050048828125, 0.2891998291015625, 0.308349609375, 0.3274993896484375, 0.346649169921875, 0.3657989501953125, 0.38494873046875, 0.4040985107421875, 0.423248291015625, 0.4423980712890625, 0.4615478515625, 0.4806976318359375, 0.499847412109375, 0.5189971923828125, 0.53814697265625, 0.5572967529296875, 0.576446533203125, 0.5955963134765625, 0.61474609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 10.0, 22.0, 39.0, 58.0, 87.0, 102.0, 137.0, 104.0, 131.0, 100.0, 66.0, 53.0, 41.0, 23.0, 15.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.263677597045898, -10.009865760803223, -9.756053924560547, -9.502243041992188, -9.248431205749512, -8.994619369506836, -8.740808486938477, -8.4869966506958, -8.233184814453125, -7.979372978210449, -7.725561618804932, -7.471750259399414, -7.217938423156738, -6.9641265869140625, -6.710315227508545, -6.456503868103027, -6.202692031860352, -5.948880195617676, -5.695068836212158, -5.441257476806641, -5.187445640563965, -4.933633804321289, -4.6798224449157715, -4.426011085510254, -4.172199249267578, -3.9183876514434814, -3.6645760536193848, -3.410764455795288, -3.1569528579711914, -2.9031412601470947, -2.649329662322998, -2.3955180644989014, -2.1417064666748047, -1.887894868850708, -1.6340832710266113, -1.3802716732025146, -1.126460075378418, -0.8726484775543213, -0.6188368797302246, -0.36502528190612793, -0.11121368408203125, 0.14259791374206543, 0.3964095115661621, 0.6502211093902588, 0.9040327072143555, 1.1578443050384521, 1.4116559028625488, 1.6654675006866455, 1.9192790985107422, 2.173090696334839, 2.4269022941589355, 2.6807138919830322, 2.934525489807129, 3.1883370876312256, 3.4421486854553223, 3.695960283279419, 3.9497718811035156, 4.203583717346191, 4.457395076751709, 4.711206436157227, 4.965018272399902, 5.218830108642578, 5.472641468048096, 5.726452827453613, 5.980264663696289]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 9.0, 11.0, 15.0, 16.0, 12.0, 16.0, 17.0, 34.0, 31.0, 35.0, 26.0, 36.0, 40.0, 40.0, 45.0, 47.0, 52.0, 37.0, 40.0, 47.0, 33.0, 51.0, 36.0, 35.0, 45.0, 24.0, 29.0, 18.0, 21.0, 13.0, 17.0, 10.0, 14.0, 10.0, 5.0, 10.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.538846969604492, -4.402700424194336, -4.26655387878418, -4.130407333374023, -3.994260787963867, -3.858114242553711, -3.7219676971435547, -3.5858211517333984, -3.449674606323242, -3.313528060913086, -3.1773815155029297, -3.0412349700927734, -2.905088424682617, -2.768941879272461, -2.6327953338623047, -2.4966487884521484, -2.360502243041992, -2.224355697631836, -2.0882091522216797, -1.9520626068115234, -1.8159160614013672, -1.679769515991211, -1.5436229705810547, -1.4074764251708984, -1.2713298797607422, -1.135183334350586, -0.9990367889404297, -0.8628902435302734, -0.7267436981201172, -0.5905971527099609, -0.4544506072998047, -0.31830406188964844, -0.1821575164794922, -0.04601097106933594, 0.09013557434082031, 0.22628211975097656, 0.3624286651611328, 0.49857521057128906, 0.6347217559814453, 0.7708683013916016, 0.9070148468017578, 1.043161392211914, 1.1793079376220703, 1.3154544830322266, 1.4516010284423828, 1.587747573852539, 1.7238941192626953, 1.8600406646728516, 1.9961872100830078, 2.132333755493164, 2.2684803009033203, 2.4046268463134766, 2.540773391723633, 2.676919937133789, 2.8130664825439453, 2.9492130279541016, 3.085359573364258, 3.221506118774414, 3.3576526641845703, 3.4937992095947266, 3.629945755004883, 3.766092300415039, 3.9022388458251953, 4.038385391235352, 4.174531936645508]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 5.0, 11.0, 17.0, 31.0, 45.0, 83.0, 142.0, 284.0, 556.0, 1168.0, 2569.0, 6169.0, 17306.0, 56259.0, 227913.0, 1117047.0, 2029512.0, 561854.0, 120993.0, 33421.0, 11226.0, 4366.0, 1764.0, 747.0, 385.0, 191.0, 110.0, 41.0, 21.0, 22.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.195526123046875, -1.15960693359375, -1.123687744140625, -1.0877685546875, -1.051849365234375, -1.01593017578125, -0.980010986328125, -0.944091796875, -0.908172607421875, -0.87225341796875, -0.836334228515625, -0.8004150390625, -0.764495849609375, -0.72857666015625, -0.692657470703125, -0.65673828125, -0.620819091796875, -0.58489990234375, -0.548980712890625, -0.5130615234375, -0.477142333984375, -0.44122314453125, -0.405303955078125, -0.369384765625, -0.333465576171875, -0.29754638671875, -0.261627197265625, -0.2257080078125, -0.189788818359375, -0.15386962890625, -0.117950439453125, -0.08203125, -0.046112060546875, -0.01019287109375, 0.025726318359375, 0.0616455078125, 0.097564697265625, 0.13348388671875, 0.169403076171875, 0.205322265625, 0.241241455078125, 0.27716064453125, 0.313079833984375, 0.3489990234375, 0.384918212890625, 0.42083740234375, 0.456756591796875, 0.49267578125, 0.528594970703125, 0.56451416015625, 0.600433349609375, 0.6363525390625, 0.672271728515625, 0.70819091796875, 0.744110107421875, 0.780029296875, 0.815948486328125, 0.85186767578125, 0.887786865234375, 0.9237060546875, 0.959625244140625, 0.99554443359375, 1.031463623046875, 1.0673828125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 9.0, 7.0, 15.0, 18.0, 17.0, 24.0, 32.0, 43.0, 43.0, 32.0, 37.0, 55.0, 49.0, 64.0, 48.0, 60.0, 63.0, 45.0, 49.0, 57.0, 46.0, 33.0, 30.0, 22.0, 16.0, 20.0, 8.0, 18.0, 9.0, 9.0, 10.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7373046875, -0.7155303955078125, -0.693756103515625, -0.6719818115234375, -0.65020751953125, -0.6284332275390625, -0.606658935546875, -0.5848846435546875, -0.5631103515625, -0.5413360595703125, -0.519561767578125, -0.4977874755859375, -0.47601318359375, -0.4542388916015625, -0.432464599609375, -0.4106903076171875, -0.388916015625, -0.3671417236328125, -0.345367431640625, -0.3235931396484375, -0.30181884765625, -0.2800445556640625, -0.258270263671875, -0.2364959716796875, -0.2147216796875, -0.1929473876953125, -0.171173095703125, -0.1493988037109375, -0.12762451171875, -0.1058502197265625, -0.084075927734375, -0.0623016357421875, -0.04052734375, -0.0187530517578125, 0.003021240234375, 0.0247955322265625, 0.04656982421875, 0.0683441162109375, 0.090118408203125, 0.1118927001953125, 0.1336669921875, 0.1554412841796875, 0.177215576171875, 0.1989898681640625, 0.22076416015625, 0.2425384521484375, 0.264312744140625, 0.2860870361328125, 0.307861328125, 0.3296356201171875, 0.351409912109375, 0.3731842041015625, 0.39495849609375, 0.4167327880859375, 0.438507080078125, 0.4602813720703125, 0.4820556640625, 0.5038299560546875, 0.525604248046875, 0.5473785400390625, 0.56915283203125, 0.5909271240234375, 0.612701416015625, 0.6344757080078125, 0.65625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 13.0, 20.0, 29.0, 47.0, 75.0, 120.0, 177.0, 393.0, 665.0, 1332.0, 3130.0, 7939.0, 25500.0, 105094.0, 561318.0, 2164897.0, 1064791.0, 196278.0, 42061.0, 12177.0, 4377.0, 1919.0, 858.0, 413.0, 276.0, 168.0, 80.0, 52.0, 34.0, 20.0, 6.0, 11.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9208984375, -1.86993408203125, -1.8189697265625, -1.76800537109375, -1.717041015625, -1.66607666015625, -1.6151123046875, -1.56414794921875, -1.51318359375, -1.46221923828125, -1.4112548828125, -1.36029052734375, -1.309326171875, -1.25836181640625, -1.2073974609375, -1.15643310546875, -1.10546875, -1.05450439453125, -1.0035400390625, -0.95257568359375, -0.901611328125, -0.85064697265625, -0.7996826171875, -0.74871826171875, -0.69775390625, -0.64678955078125, -0.5958251953125, -0.54486083984375, -0.493896484375, -0.44293212890625, -0.3919677734375, -0.34100341796875, -0.2900390625, -0.23907470703125, -0.1881103515625, -0.13714599609375, -0.086181640625, -0.03521728515625, 0.0157470703125, 0.06671142578125, 0.11767578125, 0.16864013671875, 0.2196044921875, 0.27056884765625, 0.321533203125, 0.37249755859375, 0.4234619140625, 0.47442626953125, 0.525390625, 0.57635498046875, 0.6273193359375, 0.67828369140625, 0.729248046875, 0.78021240234375, 0.8311767578125, 0.88214111328125, 0.93310546875, 0.98406982421875, 1.0350341796875, 1.08599853515625, 1.136962890625, 1.18792724609375, 1.2388916015625, 1.28985595703125, 1.3408203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 10.0, 20.0, 34.0, 28.0, 55.0, 87.0, 127.0, 183.0, 272.0, 371.0, 480.0, 518.0, 481.0, 392.0, 289.0, 215.0, 172.0, 98.0, 78.0, 50.0, 27.0, 21.0, 16.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.35546875, -1.3114013671875, -1.267333984375, -1.2232666015625, -1.17919921875, -1.1351318359375, -1.091064453125, -1.0469970703125, -1.0029296875, -0.9588623046875, -0.914794921875, -0.8707275390625, -0.82666015625, -0.7825927734375, -0.738525390625, -0.6944580078125, -0.650390625, -0.6063232421875, -0.562255859375, -0.5181884765625, -0.47412109375, -0.4300537109375, -0.385986328125, -0.3419189453125, -0.2978515625, -0.2537841796875, -0.209716796875, -0.1656494140625, -0.12158203125, -0.0775146484375, -0.033447265625, 0.0106201171875, 0.0546875, 0.0987548828125, 0.142822265625, 0.1868896484375, 0.23095703125, 0.2750244140625, 0.319091796875, 0.3631591796875, 0.4072265625, 0.4512939453125, 0.495361328125, 0.5394287109375, 0.58349609375, 0.6275634765625, 0.671630859375, 0.7156982421875, 0.759765625, 0.8038330078125, 0.847900390625, 0.8919677734375, 0.93603515625, 0.9801025390625, 1.024169921875, 1.0682373046875, 1.1123046875, 1.1563720703125, 1.200439453125, 1.2445068359375, 1.28857421875, 1.3326416015625, 1.376708984375, 1.4207763671875, 1.46484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 11.0, 13.0, 12.0, 31.0, 37.0, 57.0, 67.0, 77.0, 81.0, 86.0, 99.0, 63.0, 78.0, 76.0, 60.0, 50.0, 33.0, 21.0, 9.0, 12.0, 9.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0], "bins": [-9.641374588012695, -9.441437721252441, -9.241500854492188, -9.041563987731934, -8.84162712097168, -8.641690254211426, -8.441753387451172, -8.241816520690918, -8.041879653930664, -7.84194278717041, -7.642005920410156, -7.442069053649902, -7.242132186889648, -7.0421953201293945, -6.842258453369141, -6.642321586608887, -6.442384243011475, -6.242447376251221, -6.042510509490967, -5.842573642730713, -5.642636775970459, -5.442699909210205, -5.242762565612793, -5.042825698852539, -4.842888832092285, -4.642951965332031, -4.443015098571777, -4.243078231811523, -4.0431413650512695, -3.8432044982910156, -3.6432673931121826, -3.4433305263519287, -3.2433934211730957, -3.043456554412842, -2.843519687652588, -2.643582820892334, -2.44364595413208, -2.243709087371826, -2.043771982192993, -1.8438351154327393, -1.6438982486724854, -1.4439613819122314, -1.2440245151519775, -1.044087529182434, -0.8441506624221802, -0.6442137956619263, -0.4442768096923828, -0.2443399429321289, -0.044403076171875, 0.1555338203907013, 0.3554707169532776, 0.5554076433181763, 0.7553445100784302, 0.9552813768386841, 1.1552183628082275, 1.3551552295684814, 1.5550920963287354, 1.7550289630889893, 1.9549658298492432, 2.154902935028076, 2.35483980178833, 2.554776668548584, 2.754713535308838, 2.954650402069092, 3.1545872688293457]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 17.0, 6.0, 10.0, 16.0, 16.0, 15.0, 23.0, 19.0, 20.0, 24.0, 24.0, 24.0, 43.0, 41.0, 47.0, 32.0, 39.0, 36.0, 49.0, 40.0, 44.0, 41.0, 40.0, 37.0, 27.0, 40.0, 25.0, 21.0, 26.0, 25.0, 9.0, 19.0, 18.0, 19.0, 15.0, 9.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078807830810547, -3.948406219482422, -3.818004846572876, -3.687603235244751, -3.557201862335205, -3.42680025100708, -3.296398639678955, -3.165997266769409, -3.0355958938598633, -2.9051942825317383, -2.7747929096221924, -2.6443912982940674, -2.5139899253845215, -2.3835883140563965, -2.2531867027282715, -2.1227853298187256, -1.9923837184906006, -1.8619822263717651, -1.7315807342529297, -1.6011791229248047, -1.4707777500152588, -1.3403761386871338, -1.2099746465682983, -1.079573154449463, -0.9491716623306274, -0.818770170211792, -0.6883686780929565, -0.5579671263694763, -0.42756563425064087, -0.2971641421318054, -0.1667625904083252, -0.036361098289489746, 0.0940403938293457, 0.22444190084934235, 0.354843407869339, 0.4852449297904968, 0.6156464219093323, 0.7460479140281677, 0.876449465751648, 1.0068509578704834, 1.1372524499893188, 1.2676539421081543, 1.3980554342269897, 1.5284569263458252, 1.6588585376739502, 1.789259910583496, 1.919661521911621, 2.050063133239746, 2.180464506149292, 2.310866117477417, 2.441267490386963, 2.571669101715088, 2.702070474624634, 2.832472085952759, 2.9628734588623047, 3.0932750701904297, 3.2236766815185547, 3.3540782928466797, 3.4844796657562256, 3.6148812770843506, 3.7452826499938965, 3.8756842613220215, 4.0060858726501465, 4.136487007141113, 4.266888618469238]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 25.0, 19.0, 39.0, 48.0, 66.0, 150.0, 255.0, 456.0, 708.0, 1421.0, 2677.0, 5227.0, 10159.0, 19055.0, 36468.0, 73039.0, 145273.0, 245780.0, 235437.0, 134180.0, 67015.0, 34065.0, 17529.0, 9078.0, 4741.0, 2541.0, 1342.0, 736.0, 385.0, 232.0, 147.0, 92.0, 51.0, 33.0, 18.0, 20.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3142852783203125, -1.267242431640625, -1.2201995849609375, -1.17315673828125, -1.1261138916015625, -1.079071044921875, -1.0320281982421875, -0.9849853515625, -0.9379425048828125, -0.890899658203125, -0.8438568115234375, -0.79681396484375, -0.7497711181640625, -0.702728271484375, -0.6556854248046875, -0.608642578125, -0.5615997314453125, -0.514556884765625, -0.4675140380859375, -0.42047119140625, -0.3734283447265625, -0.326385498046875, -0.2793426513671875, -0.2322998046875, -0.1852569580078125, -0.138214111328125, -0.0911712646484375, -0.04412841796875, 0.0029144287109375, 0.049957275390625, 0.0970001220703125, 0.14404296875, 0.1910858154296875, 0.238128662109375, 0.2851715087890625, 0.33221435546875, 0.3792572021484375, 0.426300048828125, 0.4733428955078125, 0.5203857421875, 0.5674285888671875, 0.614471435546875, 0.6615142822265625, 0.70855712890625, 0.7555999755859375, 0.802642822265625, 0.8496856689453125, 0.896728515625, 0.9437713623046875, 0.990814208984375, 1.0378570556640625, 1.08489990234375, 1.1319427490234375, 1.178985595703125, 1.2260284423828125, 1.2730712890625, 1.3201141357421875, 1.367156982421875, 1.4141998291015625, 1.46124267578125, 1.5082855224609375, 1.555328369140625, 1.6023712158203125, 1.6494140625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 9.0, 23.0, 20.0, 21.0, 16.0, 25.0, 37.0, 35.0, 42.0, 49.0, 46.0, 36.0, 47.0, 48.0, 55.0, 62.0, 42.0, 55.0, 42.0, 34.0, 45.0, 29.0, 31.0, 24.0, 19.0, 18.0, 14.0, 10.0, 8.0, 7.0, 5.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7431640625, -0.722015380859375, -0.70086669921875, -0.679718017578125, -0.6585693359375, -0.637420654296875, -0.61627197265625, -0.595123291015625, -0.573974609375, -0.552825927734375, -0.53167724609375, -0.510528564453125, -0.4893798828125, -0.468231201171875, -0.44708251953125, -0.425933837890625, -0.40478515625, -0.383636474609375, -0.36248779296875, -0.341339111328125, -0.3201904296875, -0.299041748046875, -0.27789306640625, -0.256744384765625, -0.235595703125, -0.214447021484375, -0.19329833984375, -0.172149658203125, -0.1510009765625, -0.129852294921875, -0.10870361328125, -0.087554931640625, -0.06640625, -0.045257568359375, -0.02410888671875, -0.002960205078125, 0.0181884765625, 0.039337158203125, 0.06048583984375, 0.081634521484375, 0.102783203125, 0.123931884765625, 0.14508056640625, 0.166229248046875, 0.1873779296875, 0.208526611328125, 0.22967529296875, 0.250823974609375, 0.27197265625, 0.293121337890625, 0.31427001953125, 0.335418701171875, 0.3565673828125, 0.377716064453125, 0.39886474609375, 0.420013427734375, 0.441162109375, 0.462310791015625, 0.48345947265625, 0.504608154296875, 0.5257568359375, 0.546905517578125, 0.56805419921875, 0.589202880859375, 0.6103515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 9.0, 19.0, 26.0, 50.0, 72.0, 111.0, 208.0, 435.0, 965.0, 2222.0, 5457.0, 14068.0, 36125.0, 94437.0, 245040.0, 351909.0, 184751.0, 68870.0, 26096.0, 10447.0, 4108.0, 1647.0, 703.0, 340.0, 156.0, 106.0, 45.0, 32.0, 31.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.011810302734375, -1.94549560546875, -1.879180908203125, -1.8128662109375, -1.746551513671875, -1.68023681640625, -1.613922119140625, -1.547607421875, -1.481292724609375, -1.41497802734375, -1.348663330078125, -1.2823486328125, -1.216033935546875, -1.14971923828125, -1.083404541015625, -1.01708984375, -0.950775146484375, -0.88446044921875, -0.818145751953125, -0.7518310546875, -0.685516357421875, -0.61920166015625, -0.552886962890625, -0.486572265625, -0.420257568359375, -0.35394287109375, -0.287628173828125, -0.2213134765625, -0.154998779296875, -0.08868408203125, -0.022369384765625, 0.0439453125, 0.110260009765625, 0.17657470703125, 0.242889404296875, 0.3092041015625, 0.375518798828125, 0.44183349609375, 0.508148193359375, 0.574462890625, 0.640777587890625, 0.70709228515625, 0.773406982421875, 0.8397216796875, 0.906036376953125, 0.97235107421875, 1.038665771484375, 1.10498046875, 1.171295166015625, 1.23760986328125, 1.303924560546875, 1.3702392578125, 1.436553955078125, 1.50286865234375, 1.569183349609375, 1.635498046875, 1.701812744140625, 1.76812744140625, 1.834442138671875, 1.9007568359375, 1.967071533203125, 2.03338623046875, 2.099700927734375, 2.166015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 3.0, 10.0, 9.0, 13.0, 15.0, 11.0, 20.0, 28.0, 27.0, 40.0, 41.0, 51.0, 57.0, 41.0, 42.0, 47.0, 58.0, 45.0, 31.0, 47.0, 51.0, 43.0, 38.0, 38.0, 31.0, 27.0, 19.0, 27.0, 16.0, 14.0, 12.0, 11.0, 9.0, 3.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.575653076171875, -1.51263427734375, -1.449615478515625, -1.3865966796875, -1.323577880859375, -1.26055908203125, -1.197540283203125, -1.134521484375, -1.071502685546875, -1.00848388671875, -0.945465087890625, -0.8824462890625, -0.819427490234375, -0.75640869140625, -0.693389892578125, -0.63037109375, -0.567352294921875, -0.50433349609375, -0.441314697265625, -0.3782958984375, -0.315277099609375, -0.25225830078125, -0.189239501953125, -0.126220703125, -0.063201904296875, -0.00018310546875, 0.062835693359375, 0.1258544921875, 0.188873291015625, 0.25189208984375, 0.314910888671875, 0.3779296875, 0.440948486328125, 0.50396728515625, 0.566986083984375, 0.6300048828125, 0.693023681640625, 0.75604248046875, 0.819061279296875, 0.882080078125, 0.945098876953125, 1.00811767578125, 1.071136474609375, 1.1341552734375, 1.197174072265625, 1.26019287109375, 1.323211669921875, 1.38623046875, 1.449249267578125, 1.51226806640625, 1.575286865234375, 1.6383056640625, 1.701324462890625, 1.76434326171875, 1.827362060546875, 1.890380859375, 1.953399658203125, 2.01641845703125, 2.079437255859375, 2.1424560546875, 2.205474853515625, 2.26849365234375, 2.331512451171875, 2.39453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 5.0, 13.0, 17.0, 30.0, 45.0, 62.0, 94.0, 153.0, 258.0, 390.0, 649.0, 1012.0, 1586.0, 2657.0, 4647.0, 8280.0, 15455.0, 29270.0, 55455.0, 104676.0, 180962.0, 229682.0, 184216.0, 106924.0, 56423.0, 29487.0, 15479.0, 8694.0, 4740.0, 2768.0, 1662.0, 951.0, 637.0, 417.0, 271.0, 159.0, 99.0, 78.0, 54.0, 38.0, 23.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.677734375, -0.656890869140625, -0.63604736328125, -0.615203857421875, -0.5943603515625, -0.573516845703125, -0.55267333984375, -0.531829833984375, -0.510986328125, -0.490142822265625, -0.46929931640625, -0.448455810546875, -0.4276123046875, -0.406768798828125, -0.38592529296875, -0.365081787109375, -0.34423828125, -0.323394775390625, -0.30255126953125, -0.281707763671875, -0.2608642578125, -0.240020751953125, -0.21917724609375, -0.198333740234375, -0.177490234375, -0.156646728515625, -0.13580322265625, -0.114959716796875, -0.0941162109375, -0.073272705078125, -0.05242919921875, -0.031585693359375, -0.0107421875, 0.010101318359375, 0.03094482421875, 0.051788330078125, 0.0726318359375, 0.093475341796875, 0.11431884765625, 0.135162353515625, 0.156005859375, 0.176849365234375, 0.19769287109375, 0.218536376953125, 0.2393798828125, 0.260223388671875, 0.28106689453125, 0.301910400390625, 0.32275390625, 0.343597412109375, 0.36444091796875, 0.385284423828125, 0.4061279296875, 0.426971435546875, 0.44781494140625, 0.468658447265625, 0.489501953125, 0.510345458984375, 0.53118896484375, 0.552032470703125, 0.5728759765625, 0.593719482421875, 0.61456298828125, 0.635406494140625, 0.65625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 8.0, 8.0, 4.0, 7.0, 9.0, 20.0, 12.0, 22.0, 18.0, 28.0, 35.0, 40.0, 54.0, 61.0, 57.0, 97.0, 91.0, 71.0, 69.0, 63.0, 49.0, 34.0, 28.0, 20.0, 13.0, 12.0, 11.0, 10.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001990795135498047, -0.00019340217113494873, -0.00018772482872009277, -0.00018204748630523682, -0.00017637014389038086, -0.0001706928014755249, -0.00016501545906066895, -0.000159338116645813, -0.00015366077423095703, -0.00014798343181610107, -0.00014230608940124512, -0.00013662874698638916, -0.0001309514045715332, -0.00012527406215667725, -0.00011959671974182129, -0.00011391937732696533, -0.00010824203491210938, -0.00010256469249725342, -9.688735008239746e-05, -9.12100076675415e-05, -8.553266525268555e-05, -7.985532283782959e-05, -7.417798042297363e-05, -6.850063800811768e-05, -6.282329559326172e-05, -5.714595317840576e-05, -5.1468610763549805e-05, -4.579126834869385e-05, -4.011392593383789e-05, -3.4436583518981934e-05, -2.8759241104125977e-05, -2.308189868927002e-05, -1.7404556274414062e-05, -1.1727213859558105e-05, -6.0498714447021484e-06, -3.725290298461914e-07, 5.304813385009766e-06, 1.0982155799865723e-05, 1.665949821472168e-05, 2.2336840629577637e-05, 2.8014183044433594e-05, 3.369152545928955e-05, 3.936886787414551e-05, 4.5046210289001465e-05, 5.072355270385742e-05, 5.640089511871338e-05, 6.207823753356934e-05, 6.775557994842529e-05, 7.343292236328125e-05, 7.911026477813721e-05, 8.478760719299316e-05, 9.046494960784912e-05, 9.614229202270508e-05, 0.00010181963443756104, 0.00010749697685241699, 0.00011317431926727295, 0.0001188516616821289, 0.00012452900409698486, 0.00013020634651184082, 0.00013588368892669678, 0.00014156103134155273, 0.0001472383737564087, 0.00015291571617126465, 0.0001585930585861206, 0.00016427040100097656]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 12.0, 10.0, 16.0, 24.0, 36.0, 54.0, 76.0, 148.0, 247.0, 411.0, 685.0, 1287.0, 2263.0, 4327.0, 8347.0, 16775.0, 35347.0, 77042.0, 160526.0, 262753.0, 235182.0, 127876.0, 59515.0, 27758.0, 13382.0, 6636.0, 3462.0, 1843.0, 1029.0, 564.0, 343.0, 198.0, 127.0, 88.0, 60.0, 37.0, 21.0, 16.0, 6.0, 12.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.82763671875, -0.8038787841796875, -0.780120849609375, -0.7563629150390625, -0.73260498046875, -0.7088470458984375, -0.685089111328125, -0.6613311767578125, -0.6375732421875, -0.6138153076171875, -0.590057373046875, -0.5662994384765625, -0.54254150390625, -0.5187835693359375, -0.495025634765625, -0.4712677001953125, -0.447509765625, -0.4237518310546875, -0.399993896484375, -0.3762359619140625, -0.35247802734375, -0.3287200927734375, -0.304962158203125, -0.2812042236328125, -0.2574462890625, -0.2336883544921875, -0.209930419921875, -0.1861724853515625, -0.16241455078125, -0.1386566162109375, -0.114898681640625, -0.0911407470703125, -0.0673828125, -0.0436248779296875, -0.019866943359375, 0.0038909912109375, 0.02764892578125, 0.0514068603515625, 0.075164794921875, 0.0989227294921875, 0.1226806640625, 0.1464385986328125, 0.170196533203125, 0.1939544677734375, 0.21771240234375, 0.2414703369140625, 0.265228271484375, 0.2889862060546875, 0.312744140625, 0.3365020751953125, 0.360260009765625, 0.3840179443359375, 0.40777587890625, 0.4315338134765625, 0.455291748046875, 0.4790496826171875, 0.5028076171875, 0.5265655517578125, 0.550323486328125, 0.5740814208984375, 0.59783935546875, 0.6215972900390625, 0.645355224609375, 0.6691131591796875, 0.69287109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 0.0, 2.0, 5.0, 6.0, 9.0, 14.0, 14.0, 17.0, 23.0, 26.0, 30.0, 40.0, 46.0, 74.0, 69.0, 91.0, 84.0, 75.0, 74.0, 51.0, 47.0, 46.0, 41.0, 24.0, 18.0, 20.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.8323593139648438, -0.8038787841796875, -0.7753982543945312, -0.746917724609375, -0.7184371948242188, -0.6899566650390625, -0.6614761352539062, -0.63299560546875, -0.6045150756835938, -0.5760345458984375, -0.5475540161132812, -0.519073486328125, -0.49059295654296875, -0.4621124267578125, -0.43363189697265625, -0.4051513671875, -0.37667083740234375, -0.3481903076171875, -0.31970977783203125, -0.291229248046875, -0.26274871826171875, -0.2342681884765625, -0.20578765869140625, -0.17730712890625, -0.14882659912109375, -0.1203460693359375, -0.09186553955078125, -0.063385009765625, -0.03490447998046875, -0.0064239501953125, 0.02205657958984375, 0.050537109375, 0.07901763916015625, 0.1074981689453125, 0.13597869873046875, 0.164459228515625, 0.19293975830078125, 0.2214202880859375, 0.24990081787109375, 0.27838134765625, 0.30686187744140625, 0.3353424072265625, 0.36382293701171875, 0.392303466796875, 0.42078399658203125, 0.4492645263671875, 0.47774505615234375, 0.5062255859375, 0.5347061157226562, 0.5631866455078125, 0.5916671752929688, 0.620147705078125, 0.6486282348632812, 0.6771087646484375, 0.7055892944335938, 0.73406982421875, 0.7625503540039062, 0.7910308837890625, 0.8195114135742188, 0.847991943359375, 0.8764724731445312, 0.9049530029296875, 0.9334335327148438, 0.9619140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 31.0, 31.0, 46.0, 65.0, 73.0, 93.0, 104.0, 101.0, 90.0, 83.0, 72.0, 65.0, 46.0, 39.0, 20.0, 13.0, 9.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.832776069641113, -8.563865661621094, -8.294955253601074, -8.026044845581055, -7.757134437561035, -7.488224029541016, -7.219313621520996, -6.950403213500977, -6.681492805480957, -6.4125823974609375, -6.143671989440918, -5.874761581420898, -5.605851173400879, -5.336940765380859, -5.06803035736084, -4.79911994934082, -4.530209541320801, -4.261299133300781, -3.9923887252807617, -3.723478317260742, -3.4545679092407227, -3.185657501220703, -2.9167470932006836, -2.647836685180664, -2.3789262771606445, -2.110015869140625, -1.8411054611206055, -1.572195053100586, -1.3032846450805664, -1.0343742370605469, -0.7654638290405273, -0.4965534210205078, -0.2276439666748047, 0.041266441345214844, 0.3101768493652344, 0.5790872573852539, 0.8479976654052734, 1.116908073425293, 1.3858184814453125, 1.654728889465332, 1.9236392974853516, 2.192549705505371, 2.4614601135253906, 2.73037052154541, 2.9992809295654297, 3.268191337585449, 3.5371017456054688, 3.8060121536254883, 4.074922561645508, 4.343832969665527, 4.612743377685547, 4.881653785705566, 5.150564193725586, 5.4194746017456055, 5.688385009765625, 5.9572954177856445, 6.226205825805664, 6.495116233825684, 6.764026641845703, 7.032937049865723, 7.301847457885742, 7.570757865905762, 7.839668273925781, 8.1085786819458, 8.37748908996582]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 12.0, 8.0, 11.0, 14.0, 14.0, 16.0, 16.0, 26.0, 26.0, 24.0, 23.0, 37.0, 30.0, 35.0, 39.0, 33.0, 35.0, 44.0, 25.0, 33.0, 29.0, 40.0, 31.0, 42.0, 28.0, 34.0, 31.0, 27.0, 34.0, 23.0, 25.0, 16.0, 20.0, 22.0, 20.0, 12.0, 8.0, 11.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.624483108520508, -4.483680248260498, -4.342877388000488, -4.2020745277404785, -4.061271667480469, -3.920468807220459, -3.779665946960449, -3.6388630867004395, -3.4980602264404297, -3.35725736618042, -3.21645450592041, -3.0756516456604004, -2.9348487854003906, -2.794045925140381, -2.653243064880371, -2.5124402046203613, -2.3716371059417725, -2.2308342456817627, -2.090031385421753, -1.9492285251617432, -1.8084256649017334, -1.6676228046417236, -1.5268198251724243, -1.3860169649124146, -1.2452141046524048, -1.104411244392395, -0.9636083841323853, -0.8228054642677307, -0.682002604007721, -0.5411997437477112, -0.40039682388305664, -0.2595939636230469, -0.11879110336303711, 0.02201177179813385, 0.1628146469593048, 0.30361753702163696, 0.44442039728164673, 0.5852232575416565, 0.726026177406311, 0.8668290376663208, 1.0076318979263306, 1.1484347581863403, 1.28923761844635, 1.4300405979156494, 1.5708434581756592, 1.711646318435669, 1.8524491786956787, 1.9932520389556885, 2.1340548992156982, 2.274857759475708, 2.4156606197357178, 2.5564634799957275, 2.6972663402557373, 2.838069200515747, 2.978872299194336, 3.1196751594543457, 3.2604780197143555, 3.4012808799743652, 3.542083740234375, 3.6828866004943848, 3.8236894607543945, 3.9644923210144043, 4.105295181274414, 4.246098041534424, 4.386900901794434]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 10.0, 5.0, 8.0, 17.0, 33.0, 42.0, 56.0, 65.0, 121.0, 213.0, 351.0, 590.0, 1097.0, 2165.0, 4718.0, 10741.0, 27506.0, 76861.0, 242984.0, 896205.0, 1964504.0, 675976.0, 189423.0, 61480.0, 22367.0, 9102.0, 3796.0, 1763.0, 880.0, 481.0, 289.0, 143.0, 98.0, 65.0, 38.0, 32.0, 12.0, 15.0, 9.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3056640625, -1.2697906494140625, -1.233917236328125, -1.1980438232421875, -1.16217041015625, -1.1262969970703125, -1.090423583984375, -1.0545501708984375, -1.0186767578125, -0.9828033447265625, -0.946929931640625, -0.9110565185546875, -0.87518310546875, -0.8393096923828125, -0.803436279296875, -0.7675628662109375, -0.731689453125, -0.6958160400390625, -0.659942626953125, -0.6240692138671875, -0.58819580078125, -0.5523223876953125, -0.516448974609375, -0.4805755615234375, -0.4447021484375, -0.4088287353515625, -0.372955322265625, -0.3370819091796875, -0.30120849609375, -0.2653350830078125, -0.229461669921875, -0.1935882568359375, -0.15771484375, -0.1218414306640625, -0.085968017578125, -0.0500946044921875, -0.01422119140625, 0.0216522216796875, 0.057525634765625, 0.0933990478515625, 0.1292724609375, 0.1651458740234375, 0.201019287109375, 0.2368927001953125, 0.27276611328125, 0.3086395263671875, 0.344512939453125, 0.3803863525390625, 0.416259765625, 0.4521331787109375, 0.488006591796875, 0.5238800048828125, 0.55975341796875, 0.5956268310546875, 0.631500244140625, 0.6673736572265625, 0.7032470703125, 0.7391204833984375, 0.774993896484375, 0.8108673095703125, 0.84674072265625, 0.8826141357421875, 0.918487548828125, 0.9543609619140625, 0.990234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 5.0, 20.0, 23.0, 23.0, 26.0, 22.0, 26.0, 26.0, 36.0, 34.0, 56.0, 48.0, 67.0, 44.0, 51.0, 44.0, 35.0, 46.0, 35.0, 50.0, 32.0, 36.0, 42.0, 22.0, 25.0, 18.0, 17.0, 12.0, 7.0, 8.0, 8.0, 8.0, 8.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.779296875, -0.7573776245117188, -0.7354583740234375, -0.7135391235351562, -0.691619873046875, -0.6697006225585938, -0.6477813720703125, -0.6258621215820312, -0.60394287109375, -0.5820236206054688, -0.5601043701171875, -0.5381851196289062, -0.516265869140625, -0.49434661865234375, -0.4724273681640625, -0.45050811767578125, -0.4285888671875, -0.40666961669921875, -0.3847503662109375, -0.36283111572265625, -0.340911865234375, -0.31899261474609375, -0.2970733642578125, -0.27515411376953125, -0.25323486328125, -0.23131561279296875, -0.2093963623046875, -0.18747711181640625, -0.165557861328125, -0.14363861083984375, -0.1217193603515625, -0.09980010986328125, -0.077880859375, -0.05596160888671875, -0.0340423583984375, -0.01212310791015625, 0.009796142578125, 0.03171539306640625, 0.0536346435546875, 0.07555389404296875, 0.09747314453125, 0.11939239501953125, 0.1413116455078125, 0.16323089599609375, 0.185150146484375, 0.20706939697265625, 0.2289886474609375, 0.25090789794921875, 0.2728271484375, 0.29474639892578125, 0.3166656494140625, 0.33858489990234375, 0.360504150390625, 0.38242340087890625, 0.4043426513671875, 0.42626190185546875, 0.44818115234375, 0.47010040283203125, 0.4920196533203125, 0.5139389038085938, 0.535858154296875, 0.5577774047851562, 0.5796966552734375, 0.6016159057617188, 0.62353515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 7.0, 9.0, 12.0, 28.0, 36.0, 54.0, 91.0, 164.0, 273.0, 423.0, 817.0, 1598.0, 3523.0, 8442.0, 23320.0, 76251.0, 306394.0, 1383675.0, 1810855.0, 428071.0, 101657.0, 29933.0, 10397.0, 4131.0, 1925.0, 954.0, 518.0, 249.0, 162.0, 113.0, 52.0, 39.0, 36.0, 21.0, 13.0, 3.0, 9.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7578125, -1.695281982421875, -1.63275146484375, -1.570220947265625, -1.5076904296875, -1.445159912109375, -1.38262939453125, -1.320098876953125, -1.257568359375, -1.195037841796875, -1.13250732421875, -1.069976806640625, -1.0074462890625, -0.944915771484375, -0.88238525390625, -0.819854736328125, -0.75732421875, -0.694793701171875, -0.63226318359375, -0.569732666015625, -0.5072021484375, -0.444671630859375, -0.38214111328125, -0.319610595703125, -0.257080078125, -0.194549560546875, -0.13201904296875, -0.069488525390625, -0.0069580078125, 0.055572509765625, 0.11810302734375, 0.180633544921875, 0.2431640625, 0.305694580078125, 0.36822509765625, 0.430755615234375, 0.4932861328125, 0.555816650390625, 0.61834716796875, 0.680877685546875, 0.743408203125, 0.805938720703125, 0.86846923828125, 0.930999755859375, 0.9935302734375, 1.056060791015625, 1.11859130859375, 1.181121826171875, 1.24365234375, 1.306182861328125, 1.36871337890625, 1.431243896484375, 1.4937744140625, 1.556304931640625, 1.61883544921875, 1.681365966796875, 1.743896484375, 1.806427001953125, 1.86895751953125, 1.931488037109375, 1.9940185546875, 2.056549072265625, 2.11907958984375, 2.181610107421875, 2.244140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 7.0, 8.0, 17.0, 19.0, 35.0, 51.0, 66.0, 84.0, 130.0, 222.0, 268.0, 377.0, 521.0, 619.0, 473.0, 346.0, 259.0, 186.0, 117.0, 89.0, 56.0, 38.0, 30.0, 19.0, 10.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5093536376953125, -1.454254150390625, -1.3991546630859375, -1.34405517578125, -1.2889556884765625, -1.233856201171875, -1.1787567138671875, -1.1236572265625, -1.0685577392578125, -1.013458251953125, -0.9583587646484375, -0.90325927734375, -0.8481597900390625, -0.793060302734375, -0.7379608154296875, -0.682861328125, -0.6277618408203125, -0.572662353515625, -0.5175628662109375, -0.46246337890625, -0.4073638916015625, -0.352264404296875, -0.2971649169921875, -0.2420654296875, -0.1869659423828125, -0.131866455078125, -0.0767669677734375, -0.02166748046875, 0.0334320068359375, 0.088531494140625, 0.1436309814453125, 0.19873046875, 0.2538299560546875, 0.308929443359375, 0.3640289306640625, 0.41912841796875, 0.4742279052734375, 0.529327392578125, 0.5844268798828125, 0.6395263671875, 0.6946258544921875, 0.749725341796875, 0.8048248291015625, 0.85992431640625, 0.9150238037109375, 0.970123291015625, 1.0252227783203125, 1.080322265625, 1.1354217529296875, 1.190521240234375, 1.2456207275390625, 1.30072021484375, 1.3558197021484375, 1.410919189453125, 1.4660186767578125, 1.5211181640625, 1.5762176513671875, 1.631317138671875, 1.6864166259765625, 1.74151611328125, 1.7966156005859375, 1.851715087890625, 1.9068145751953125, 1.9619140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 20.0, 20.0, 29.0, 58.0, 69.0, 67.0, 89.0, 91.0, 114.0, 82.0, 80.0, 71.0, 68.0, 45.0, 24.0, 21.0, 14.0, 10.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5529046058654785, -7.2928547859191895, -7.032805442810059, -6.7727556228637695, -6.512706279754639, -6.25265645980835, -5.992607116699219, -5.73255729675293, -5.472507476806641, -5.212457656860352, -4.952408313751221, -4.692358493804932, -4.432309150695801, -4.172259330749512, -3.9122097492218018, -3.652160167694092, -3.392110824584961, -3.132061243057251, -2.872011661529541, -2.611961841583252, -2.351912498474121, -2.091862678527832, -1.831813097000122, -1.571763515472412, -1.3117139339447021, -1.0516643524169922, -0.7916147112846375, -0.5315650701522827, -0.27151548862457275, -0.011465907096862793, 0.24858379364013672, 0.5086333751678467, 0.7686834335327148, 1.0287330150604248, 1.2887825965881348, 1.5488322973251343, 1.8088818788528442, 2.0689315795898438, 2.3289811611175537, 2.5890307426452637, 2.8490803241729736, 3.1091299057006836, 3.3691794872283936, 3.6292290687561035, 3.8892788887023926, 4.149328231811523, 4.4093780517578125, 4.669427871704102, 4.929477214813232, 5.1895270347595215, 5.449576377868652, 5.709626197814941, 5.969675540924072, 6.229725360870361, 6.489774703979492, 6.749824523925781, 7.00987434387207, 7.269924163818359, 7.52997350692749, 7.790023326873779, 8.05007266998291, 8.3101224899292, 8.570172309875488, 8.830221176147461, 9.09027099609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 7.0, 10.0, 13.0, 8.0, 11.0, 16.0, 21.0, 30.0, 27.0, 32.0, 33.0, 40.0, 41.0, 38.0, 41.0, 44.0, 46.0, 39.0, 45.0, 50.0, 35.0, 39.0, 34.0, 42.0, 40.0, 41.0, 27.0, 17.0, 14.0, 17.0, 15.0, 16.0, 10.0, 12.0, 15.0, 4.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.416705131530762, -4.264392852783203, -4.112080097198486, -3.9597678184509277, -3.807455539703369, -3.6551430225372314, -3.5028305053710938, -3.350518226623535, -3.1982057094573975, -3.0458931922912598, -2.893580913543701, -2.7412683963775635, -2.588955879211426, -2.436643600463867, -2.2843310832977295, -2.132018566131592, -1.9797062873840332, -1.827393889427185, -1.675081491470337, -1.5227689743041992, -1.370456576347351, -1.218144178390503, -1.0658316612243652, -0.9135192632675171, -0.761206865310669, -0.6088944673538208, -0.4565820097923279, -0.30426958203315735, -0.15195715427398682, 0.0003552436828613281, 0.15266770124435425, 0.30498015880584717, 0.4572920799255371, 0.6096044778823853, 0.7619169354438782, 0.9142293930053711, 1.0665417909622192, 1.2188541889190674, 1.371166706085205, 1.5234791040420532, 1.6757915019989014, 1.8281038999557495, 1.9804162979125977, 2.1327288150787354, 2.285041332244873, 2.4373536109924316, 2.5896661281585693, 2.741978645324707, 2.8942909240722656, 3.0466034412384033, 3.198915719985962, 3.3512282371520996, 3.503540515899658, 3.655853033065796, 3.8081655502319336, 3.960477828979492, 4.112790107727051, 4.265102386474609, 4.417415142059326, 4.569727420806885, 4.722039699554443, 4.87435245513916, 5.026664733886719, 5.178977012634277, 5.331289768218994]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 8.0, 9.0, 12.0, 17.0, 24.0, 44.0, 70.0, 96.0, 192.0, 295.0, 494.0, 863.0, 1634.0, 2805.0, 5081.0, 9053.0, 16830.0, 30664.0, 58479.0, 122490.0, 240919.0, 264025.0, 146385.0, 69357.0, 35628.0, 19145.0, 10531.0, 5650.0, 3376.0, 1944.0, 995.0, 600.0, 334.0, 191.0, 126.0, 78.0, 34.0, 25.0, 19.0, 8.0, 8.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5419921875, -1.499298095703125, -1.45660400390625, -1.413909912109375, -1.3712158203125, -1.328521728515625, -1.28582763671875, -1.243133544921875, -1.200439453125, -1.157745361328125, -1.11505126953125, -1.072357177734375, -1.0296630859375, -0.986968994140625, -0.94427490234375, -0.901580810546875, -0.85888671875, -0.816192626953125, -0.77349853515625, -0.730804443359375, -0.6881103515625, -0.645416259765625, -0.60272216796875, -0.560028076171875, -0.517333984375, -0.474639892578125, -0.43194580078125, -0.389251708984375, -0.3465576171875, -0.303863525390625, -0.26116943359375, -0.218475341796875, -0.17578125, -0.133087158203125, -0.09039306640625, -0.047698974609375, -0.0050048828125, 0.037689208984375, 0.08038330078125, 0.123077392578125, 0.165771484375, 0.208465576171875, 0.25115966796875, 0.293853759765625, 0.3365478515625, 0.379241943359375, 0.42193603515625, 0.464630126953125, 0.50732421875, 0.550018310546875, 0.59271240234375, 0.635406494140625, 0.6781005859375, 0.720794677734375, 0.76348876953125, 0.806182861328125, 0.848876953125, 0.891571044921875, 0.93426513671875, 0.976959228515625, 1.0196533203125, 1.062347412109375, 1.10504150390625, 1.147735595703125, 1.1904296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 10.0, 6.0, 12.0, 13.0, 18.0, 19.0, 23.0, 23.0, 23.0, 29.0, 30.0, 37.0, 39.0, 31.0, 37.0, 38.0, 52.0, 36.0, 44.0, 29.0, 38.0, 40.0, 42.0, 51.0, 29.0, 19.0, 24.0, 21.0, 23.0, 25.0, 18.0, 14.0, 15.0, 14.0, 10.0, 7.0, 12.0, 4.0, 5.0, 7.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.6455078125, -0.6254806518554688, -0.6054534912109375, -0.5854263305664062, -0.565399169921875, -0.5453720092773438, -0.5253448486328125, -0.5053176879882812, -0.48529052734375, -0.46526336669921875, -0.4452362060546875, -0.42520904541015625, -0.405181884765625, -0.38515472412109375, -0.3651275634765625, -0.34510040283203125, -0.3250732421875, -0.30504608154296875, -0.2850189208984375, -0.26499176025390625, -0.244964599609375, -0.22493743896484375, -0.2049102783203125, -0.18488311767578125, -0.16485595703125, -0.14482879638671875, -0.1248016357421875, -0.10477447509765625, -0.084747314453125, -0.06472015380859375, -0.0446929931640625, -0.02466583251953125, -0.004638671875, 0.01538848876953125, 0.0354156494140625, 0.05544281005859375, 0.075469970703125, 0.09549713134765625, 0.1155242919921875, 0.13555145263671875, 0.15557861328125, 0.17560577392578125, 0.1956329345703125, 0.21566009521484375, 0.235687255859375, 0.25571441650390625, 0.2757415771484375, 0.29576873779296875, 0.3157958984375, 0.33582305908203125, 0.3558502197265625, 0.37587738037109375, 0.395904541015625, 0.41593170166015625, 0.4359588623046875, 0.45598602294921875, 0.47601318359375, 0.49604034423828125, 0.5160675048828125, 0.5360946655273438, 0.556121826171875, 0.5761489868164062, 0.5961761474609375, 0.6162033081054688, 0.63623046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 12.0, 7.0, 5.0, 7.0, 16.0, 21.0, 23.0, 29.0, 70.0, 84.0, 146.0, 227.0, 415.0, 750.0, 1350.0, 2531.0, 5091.0, 10971.0, 25082.0, 60259.0, 176589.0, 415399.0, 221698.0, 73074.0, 29547.0, 12840.0, 5958.0, 2906.0, 1460.0, 810.0, 490.0, 234.0, 157.0, 75.0, 53.0, 48.0, 23.0, 19.0, 20.0, 11.0, 9.0, 7.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9541015625, -1.8880767822265625, -1.822052001953125, -1.7560272216796875, -1.69000244140625, -1.6239776611328125, -1.557952880859375, -1.4919281005859375, -1.4259033203125, -1.3598785400390625, -1.293853759765625, -1.2278289794921875, -1.16180419921875, -1.0957794189453125, -1.029754638671875, -0.9637298583984375, -0.897705078125, -0.8316802978515625, -0.765655517578125, -0.6996307373046875, -0.63360595703125, -0.5675811767578125, -0.501556396484375, -0.4355316162109375, -0.3695068359375, -0.3034820556640625, -0.237457275390625, -0.1714324951171875, -0.10540771484375, -0.0393829345703125, 0.026641845703125, 0.0926666259765625, 0.15869140625, 0.2247161865234375, 0.290740966796875, 0.3567657470703125, 0.42279052734375, 0.4888153076171875, 0.554840087890625, 0.6208648681640625, 0.6868896484375, 0.7529144287109375, 0.818939208984375, 0.8849639892578125, 0.95098876953125, 1.0170135498046875, 1.083038330078125, 1.1490631103515625, 1.215087890625, 1.2811126708984375, 1.347137451171875, 1.4131622314453125, 1.47918701171875, 1.5452117919921875, 1.611236572265625, 1.6772613525390625, 1.7432861328125, 1.8093109130859375, 1.875335693359375, 1.9413604736328125, 2.00738525390625, 2.0734100341796875, 2.139434814453125, 2.2054595947265625, 2.271484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 9.0, 12.0, 8.0, 11.0, 10.0, 21.0, 12.0, 21.0, 20.0, 22.0, 30.0, 37.0, 28.0, 40.0, 43.0, 60.0, 47.0, 43.0, 35.0, 60.0, 37.0, 43.0, 48.0, 37.0, 31.0, 37.0, 28.0, 23.0, 25.0, 11.0, 12.0, 13.0, 18.0, 5.0, 10.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90234375, -1.835845947265625, -1.76934814453125, -1.702850341796875, -1.6363525390625, -1.569854736328125, -1.50335693359375, -1.436859130859375, -1.370361328125, -1.303863525390625, -1.23736572265625, -1.170867919921875, -1.1043701171875, -1.037872314453125, -0.97137451171875, -0.904876708984375, -0.83837890625, -0.771881103515625, -0.70538330078125, -0.638885498046875, -0.5723876953125, -0.505889892578125, -0.43939208984375, -0.372894287109375, -0.306396484375, -0.239898681640625, -0.17340087890625, -0.106903076171875, -0.0404052734375, 0.026092529296875, 0.09259033203125, 0.159088134765625, 0.2255859375, 0.292083740234375, 0.35858154296875, 0.425079345703125, 0.4915771484375, 0.558074951171875, 0.62457275390625, 0.691070556640625, 0.757568359375, 0.824066162109375, 0.89056396484375, 0.957061767578125, 1.0235595703125, 1.090057373046875, 1.15655517578125, 1.223052978515625, 1.28955078125, 1.356048583984375, 1.42254638671875, 1.489044189453125, 1.5555419921875, 1.622039794921875, 1.68853759765625, 1.755035400390625, 1.821533203125, 1.888031005859375, 1.95452880859375, 2.021026611328125, 2.0875244140625, 2.154022216796875, 2.22052001953125, 2.287017822265625, 2.353515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 15.0, 27.0, 17.0, 36.0, 41.0, 60.0, 88.0, 126.0, 198.0, 282.0, 396.0, 648.0, 930.0, 1341.0, 2256.0, 3525.0, 5546.0, 9251.0, 15338.0, 26170.0, 46559.0, 93054.0, 200505.0, 282363.0, 176256.0, 81606.0, 41472.0, 23672.0, 14067.0, 8349.0, 5222.0, 3169.0, 2089.0, 1313.0, 829.0, 560.0, 393.0, 250.0, 152.0, 105.0, 91.0, 70.0, 28.0, 20.0, 15.0, 21.0, 16.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7003097534179688, -0.6764984130859375, -0.6526870727539062, -0.628875732421875, -0.6050643920898438, -0.5812530517578125, -0.5574417114257812, -0.53363037109375, -0.5098190307617188, -0.4860076904296875, -0.46219635009765625, -0.438385009765625, -0.41457366943359375, -0.3907623291015625, -0.36695098876953125, -0.3431396484375, -0.31932830810546875, -0.2955169677734375, -0.27170562744140625, -0.247894287109375, -0.22408294677734375, -0.2002716064453125, -0.17646026611328125, -0.15264892578125, -0.12883758544921875, -0.1050262451171875, -0.08121490478515625, -0.057403564453125, -0.03359222412109375, -0.0097808837890625, 0.01403045654296875, 0.037841796875, 0.06165313720703125, 0.0854644775390625, 0.10927581787109375, 0.133087158203125, 0.15689849853515625, 0.1807098388671875, 0.20452117919921875, 0.22833251953125, 0.25214385986328125, 0.2759552001953125, 0.29976654052734375, 0.323577880859375, 0.34738922119140625, 0.3712005615234375, 0.39501190185546875, 0.4188232421875, 0.44263458251953125, 0.4664459228515625, 0.49025726318359375, 0.514068603515625, 0.5378799438476562, 0.5616912841796875, 0.5855026245117188, 0.60931396484375, 0.6331253051757812, 0.6569366455078125, 0.6807479858398438, 0.704559326171875, 0.7283706665039062, 0.7521820068359375, 0.7759933471679688, 0.7998046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 6.0, 8.0, 4.0, 14.0, 13.0, 13.0, 17.0, 27.0, 39.0, 70.0, 68.0, 94.0, 120.0, 111.0, 94.0, 52.0, 44.0, 35.0, 27.0, 20.0, 18.0, 7.0, 15.0, 11.0, 7.0, 14.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002014636993408203, -0.00019466131925582886, -0.0001878589391708374, -0.00018105655908584595, -0.0001742541790008545, -0.00016745179891586304, -0.00016064941883087158, -0.00015384703874588013, -0.00014704465866088867, -0.00014024227857589722, -0.00013343989849090576, -0.0001266375184059143, -0.00011983513832092285, -0.0001130327582359314, -0.00010623037815093994, -9.942799806594849e-05, -9.262561798095703e-05, -8.582323789596558e-05, -7.902085781097412e-05, -7.221847772598267e-05, -6.541609764099121e-05, -5.8613717555999756e-05, -5.18113374710083e-05, -4.5008957386016846e-05, -3.820657730102539e-05, -3.1404197216033936e-05, -2.460181713104248e-05, -1.7799437046051025e-05, -1.099705696105957e-05, -4.194676876068115e-06, 2.60770320892334e-06, 9.410083293914795e-06, 1.621246337890625e-05, 2.3014843463897705e-05, 2.981722354888916e-05, 3.6619603633880615e-05, 4.342198371887207e-05, 5.0224363803863525e-05, 5.702674388885498e-05, 6.382912397384644e-05, 7.063150405883789e-05, 7.743388414382935e-05, 8.42362642288208e-05, 9.103864431381226e-05, 9.784102439880371e-05, 0.00010464340448379517, 0.00011144578456878662, 0.00011824816465377808, 0.00012505054473876953, 0.00013185292482376099, 0.00013865530490875244, 0.0001454576849937439, 0.00015226006507873535, 0.0001590624451637268, 0.00016586482524871826, 0.00017266720533370972, 0.00017946958541870117, 0.00018627196550369263, 0.00019307434558868408, 0.00019987672567367554, 0.000206679105758667, 0.00021348148584365845, 0.0002202838659286499, 0.00022708624601364136, 0.0002338886260986328]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 18.0, 12.0, 30.0, 47.0, 58.0, 79.0, 138.0, 168.0, 242.0, 402.0, 599.0, 1017.0, 1649.0, 2508.0, 4279.0, 7417.0, 13081.0, 23924.0, 45748.0, 94208.0, 215745.0, 302568.0, 173180.0, 75736.0, 37878.0, 20193.0, 11288.0, 6405.0, 3770.0, 2259.0, 1411.0, 876.0, 512.0, 388.0, 217.0, 150.0, 105.0, 78.0, 57.0, 29.0, 25.0, 12.0, 15.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.837890625, -0.812774658203125, -0.78765869140625, -0.762542724609375, -0.7374267578125, -0.712310791015625, -0.68719482421875, -0.662078857421875, -0.636962890625, -0.611846923828125, -0.58673095703125, -0.561614990234375, -0.5364990234375, -0.511383056640625, -0.48626708984375, -0.461151123046875, -0.43603515625, -0.410919189453125, -0.38580322265625, -0.360687255859375, -0.3355712890625, -0.310455322265625, -0.28533935546875, -0.260223388671875, -0.235107421875, -0.209991455078125, -0.18487548828125, -0.159759521484375, -0.1346435546875, -0.109527587890625, -0.08441162109375, -0.059295654296875, -0.0341796875, -0.009063720703125, 0.01605224609375, 0.041168212890625, 0.0662841796875, 0.091400146484375, 0.11651611328125, 0.141632080078125, 0.166748046875, 0.191864013671875, 0.21697998046875, 0.242095947265625, 0.2672119140625, 0.292327880859375, 0.31744384765625, 0.342559814453125, 0.36767578125, 0.392791748046875, 0.41790771484375, 0.443023681640625, 0.4681396484375, 0.493255615234375, 0.51837158203125, 0.543487548828125, 0.568603515625, 0.593719482421875, 0.61883544921875, 0.643951416015625, 0.6690673828125, 0.694183349609375, 0.71929931640625, 0.744415283203125, 0.76953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 8.0, 9.0, 15.0, 20.0, 28.0, 30.0, 46.0, 47.0, 79.0, 85.0, 110.0, 99.0, 91.0, 67.0, 57.0, 30.0, 30.0, 26.0, 20.0, 24.0, 11.0, 13.0, 9.0, 2.0, 2.0, 3.0, 1.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9232864379882812, -0.8890533447265625, -0.8548202514648438, -0.820587158203125, -0.7863540649414062, -0.7521209716796875, -0.7178878784179688, -0.68365478515625, -0.6494216918945312, -0.6151885986328125, -0.5809555053710938, -0.546722412109375, -0.5124893188476562, -0.4782562255859375, -0.44402313232421875, -0.4097900390625, -0.37555694580078125, -0.3413238525390625, -0.30709075927734375, -0.272857666015625, -0.23862457275390625, -0.2043914794921875, -0.17015838623046875, -0.13592529296875, -0.10169219970703125, -0.0674591064453125, -0.03322601318359375, 0.001007080078125, 0.03524017333984375, 0.0694732666015625, 0.10370635986328125, 0.137939453125, 0.17217254638671875, 0.2064056396484375, 0.24063873291015625, 0.274871826171875, 0.30910491943359375, 0.3433380126953125, 0.37757110595703125, 0.41180419921875, 0.44603729248046875, 0.4802703857421875, 0.5145034790039062, 0.548736572265625, 0.5829696655273438, 0.6172027587890625, 0.6514358520507812, 0.6856689453125, 0.7199020385742188, 0.7541351318359375, 0.7883682250976562, 0.822601318359375, 0.8568344116210938, 0.8910675048828125, 0.9253005981445312, 0.95953369140625, 0.9937667846679688, 1.0279998779296875, 1.0622329711914062, 1.096466064453125, 1.1306991577148438, 1.1649322509765625, 1.1991653442382812, 1.2333984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 7.0, 7.0, 8.0, 4.0, 12.0, 18.0, 19.0, 30.0, 25.0, 29.0, 36.0, 36.0, 34.0, 33.0, 46.0, 50.0, 44.0, 50.0, 54.0, 42.0, 63.0, 53.0, 40.0, 36.0, 35.0, 21.0, 15.0, 27.0, 27.0, 10.0, 8.0, 11.0, 11.0, 7.0, 12.0, 4.0, 6.0, 5.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.08251953125, -4.935297966003418, -4.788075923919678, -4.6408538818359375, -4.4936323165893555, -4.346410751342773, -4.199188709259033, -4.051966667175293, -3.904745101928711, -3.75752329826355, -3.6103014945983887, -3.4630796909332275, -3.3158578872680664, -3.1686360836029053, -3.021414279937744, -2.874192476272583, -2.726970672607422, -2.5797488689422607, -2.4325270652770996, -2.2853052616119385, -2.1380834579467773, -1.9908616542816162, -1.843639850616455, -1.696418046951294, -1.5491962432861328, -1.4019744396209717, -1.2547526359558105, -1.1075308322906494, -0.9603090286254883, -0.8130872249603271, -0.665865421295166, -0.5186436176300049, -0.37142229080200195, -0.22420048713684082, -0.07697868347167969, 0.07024312019348145, 0.21746492385864258, 0.3646867275238037, 0.5119085311889648, 0.659130334854126, 0.8063521385192871, 0.9535739421844482, 1.1007957458496094, 1.2480175495147705, 1.3952393531799316, 1.5424611568450928, 1.689682960510254, 1.836904764175415, 1.9841265678405762, 2.1313483715057373, 2.2785701751708984, 2.4257919788360596, 2.5730137825012207, 2.720235586166382, 2.867457389831543, 3.014679193496704, 3.1619009971618652, 3.3091228008270264, 3.4563446044921875, 3.6035664081573486, 3.7507882118225098, 3.898010015487671, 4.045231819152832, 4.192453384399414, 4.339675426483154]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 12.0, 6.0, 10.0, 13.0, 13.0, 20.0, 24.0, 23.0, 31.0, 21.0, 43.0, 49.0, 44.0, 38.0, 55.0, 40.0, 50.0, 36.0, 46.0, 32.0, 39.0, 34.0, 30.0, 26.0, 40.0, 26.0, 29.0, 20.0, 22.0, 24.0, 14.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-5.955738067626953, -5.759530544281006, -5.5633225440979, -5.367115020751953, -5.170907020568848, -4.9746994972229, -4.778491973876953, -4.582283973693848, -4.386075973510742, -4.189868450164795, -3.9936604499816895, -3.797452926635742, -3.6012449264526367, -3.4050374031066895, -3.208829641342163, -3.0126218795776367, -2.8164143562316895, -2.620206594467163, -2.4239988327026367, -2.2277913093566895, -2.031583309173584, -1.8353756666183472, -1.6391680240631104, -1.442960262298584, -1.2467525005340576, -1.0505447387695312, -0.8543370366096497, -0.6581293344497681, -0.4619215726852417, -0.26571381092071533, -0.06950616836547852, 0.12670159339904785, 0.3229098320007324, 0.5191175937652588, 0.7153252959251404, 0.911532998085022, 1.1077407598495483, 1.3039485216140747, 1.5001561641693115, 1.696363925933838, 1.8925716876983643, 2.0887794494628906, 2.284987211227417, 2.4811949729919434, 2.6774024963378906, 2.873610496520996, 3.0698180198669434, 3.2660257816314697, 3.462233543395996, 3.6584413051605225, 3.854649066925049, 4.050856590270996, 4.247064590454102, 4.443272113800049, 4.639479637145996, 4.835687637329102, 5.031895637512207, 5.228103160858154, 5.42431116104126, 5.620518684387207, 5.8167266845703125, 6.01293420791626, 6.209141731262207, 6.4053497314453125, 6.60155725479126]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 12.0, 12.0, 18.0, 25.0, 39.0, 51.0, 78.0, 108.0, 159.0, 265.0, 394.0, 629.0, 1032.0, 1900.0, 3415.0, 6248.0, 12650.0, 25786.0, 55685.0, 129117.0, 329779.0, 1078785.0, 1739220.0, 488596.0, 178593.0, 74765.0, 33400.0, 15928.0, 7994.0, 4112.0, 2233.0, 1233.0, 777.0, 427.0, 292.0, 173.0, 101.0, 74.0, 56.0, 35.0, 27.0, 16.0, 13.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1796875, -1.144134521484375, -1.10858154296875, -1.073028564453125, -1.0374755859375, -1.001922607421875, -0.96636962890625, -0.930816650390625, -0.895263671875, -0.859710693359375, -0.82415771484375, -0.788604736328125, -0.7530517578125, -0.717498779296875, -0.68194580078125, -0.646392822265625, -0.61083984375, -0.575286865234375, -0.53973388671875, -0.504180908203125, -0.4686279296875, -0.433074951171875, -0.39752197265625, -0.361968994140625, -0.326416015625, -0.290863037109375, -0.25531005859375, -0.219757080078125, -0.1842041015625, -0.148651123046875, -0.11309814453125, -0.077545166015625, -0.0419921875, -0.006439208984375, 0.02911376953125, 0.064666748046875, 0.1002197265625, 0.135772705078125, 0.17132568359375, 0.206878662109375, 0.242431640625, 0.277984619140625, 0.31353759765625, 0.349090576171875, 0.3846435546875, 0.420196533203125, 0.45574951171875, 0.491302490234375, 0.52685546875, 0.562408447265625, 0.59796142578125, 0.633514404296875, 0.6690673828125, 0.704620361328125, 0.74017333984375, 0.775726318359375, 0.811279296875, 0.846832275390625, 0.88238525390625, 0.917938232421875, 0.9534912109375, 0.989044189453125, 1.02459716796875, 1.060150146484375, 1.095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 8.0, 7.0, 8.0, 9.0, 12.0, 13.0, 6.0, 24.0, 20.0, 24.0, 31.0, 29.0, 33.0, 37.0, 44.0, 41.0, 36.0, 37.0, 39.0, 56.0, 43.0, 52.0, 38.0, 33.0, 37.0, 29.0, 30.0, 24.0, 21.0, 17.0, 16.0, 22.0, 18.0, 19.0, 15.0, 13.0, 7.0, 14.0, 4.0, 5.0, 7.0, 9.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.80126953125, -0.7776947021484375, -0.754119873046875, -0.7305450439453125, -0.70697021484375, -0.6833953857421875, -0.659820556640625, -0.6362457275390625, -0.6126708984375, -0.5890960693359375, -0.565521240234375, -0.5419464111328125, -0.51837158203125, -0.4947967529296875, -0.471221923828125, -0.4476470947265625, -0.424072265625, -0.4004974365234375, -0.376922607421875, -0.3533477783203125, -0.32977294921875, -0.3061981201171875, -0.282623291015625, -0.2590484619140625, -0.2354736328125, -0.2118988037109375, -0.188323974609375, -0.1647491455078125, -0.14117431640625, -0.1175994873046875, -0.094024658203125, -0.0704498291015625, -0.046875, -0.0233001708984375, 0.000274658203125, 0.0238494873046875, 0.04742431640625, 0.0709991455078125, 0.094573974609375, 0.1181488037109375, 0.1417236328125, 0.1652984619140625, 0.188873291015625, 0.2124481201171875, 0.23602294921875, 0.2595977783203125, 0.283172607421875, 0.3067474365234375, 0.330322265625, 0.3538970947265625, 0.377471923828125, 0.4010467529296875, 0.42462158203125, 0.4481964111328125, 0.471771240234375, 0.4953460693359375, 0.5189208984375, 0.5424957275390625, 0.566070556640625, 0.5896453857421875, 0.61322021484375, 0.6367950439453125, 0.660369873046875, 0.6839447021484375, 0.70751953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 5.0, 6.0, 13.0, 17.0, 18.0, 34.0, 44.0, 83.0, 114.0, 185.0, 312.0, 618.0, 1036.0, 2231.0, 5060.0, 13811.0, 44613.0, 169206.0, 811434.0, 2380145.0, 582101.0, 128509.0, 34882.0, 11413.0, 4285.0, 1950.0, 944.0, 477.0, 260.0, 147.0, 102.0, 68.0, 40.0, 31.0, 24.0, 16.0, 11.0, 3.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.9140625, -2.824127197265625, -2.73419189453125, -2.644256591796875, -2.5543212890625, -2.464385986328125, -2.37445068359375, -2.284515380859375, -2.194580078125, -2.104644775390625, -2.01470947265625, -1.924774169921875, -1.8348388671875, -1.744903564453125, -1.65496826171875, -1.565032958984375, -1.47509765625, -1.385162353515625, -1.29522705078125, -1.205291748046875, -1.1153564453125, -1.025421142578125, -0.93548583984375, -0.845550537109375, -0.755615234375, -0.665679931640625, -0.57574462890625, -0.485809326171875, -0.3958740234375, -0.305938720703125, -0.21600341796875, -0.126068115234375, -0.0361328125, 0.053802490234375, 0.14373779296875, 0.233673095703125, 0.3236083984375, 0.413543701171875, 0.50347900390625, 0.593414306640625, 0.683349609375, 0.773284912109375, 0.86322021484375, 0.953155517578125, 1.0430908203125, 1.133026123046875, 1.22296142578125, 1.312896728515625, 1.40283203125, 1.492767333984375, 1.58270263671875, 1.672637939453125, 1.7625732421875, 1.852508544921875, 1.94244384765625, 2.032379150390625, 2.122314453125, 2.212249755859375, 2.30218505859375, 2.392120361328125, 2.4820556640625, 2.571990966796875, 2.66192626953125, 2.751861572265625, 2.841796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 13.0, 16.0, 36.0, 49.0, 97.0, 132.0, 245.0, 385.0, 643.0, 901.0, 594.0, 337.0, 218.0, 161.0, 80.0, 57.0, 32.0, 23.0, 16.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.365875244140625, -3.28057861328125, -3.195281982421875, -3.1099853515625, -3.024688720703125, -2.93939208984375, -2.854095458984375, -2.768798828125, -2.683502197265625, -2.59820556640625, -2.512908935546875, -2.4276123046875, -2.342315673828125, -2.25701904296875, -2.171722412109375, -2.08642578125, -2.001129150390625, -1.91583251953125, -1.830535888671875, -1.7452392578125, -1.659942626953125, -1.57464599609375, -1.489349365234375, -1.404052734375, -1.318756103515625, -1.23345947265625, -1.148162841796875, -1.0628662109375, -0.977569580078125, -0.89227294921875, -0.806976318359375, -0.7216796875, -0.636383056640625, -0.55108642578125, -0.465789794921875, -0.3804931640625, -0.295196533203125, -0.20989990234375, -0.124603271484375, -0.039306640625, 0.045989990234375, 0.13128662109375, 0.216583251953125, 0.3018798828125, 0.387176513671875, 0.47247314453125, 0.557769775390625, 0.64306640625, 0.728363037109375, 0.81365966796875, 0.898956298828125, 0.9842529296875, 1.069549560546875, 1.15484619140625, 1.240142822265625, 1.325439453125, 1.410736083984375, 1.49603271484375, 1.581329345703125, 1.6666259765625, 1.751922607421875, 1.83721923828125, 1.922515869140625, 2.0078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 18.0, 34.0, 48.0, 82.0, 114.0, 129.0, 146.0, 126.0, 119.0, 76.0, 45.0, 31.0, 15.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.349769592285156, -7.915297031402588, -7.4808244705200195, -7.046351432800293, -6.611879348754883, -6.177406311035156, -5.742933750152588, -5.3084611892700195, -4.873988628387451, -4.439516067504883, -4.0050435066223145, -3.570570707321167, -3.1360981464385986, -2.7016255855560303, -2.267152786254883, -1.8326802253723145, -1.398207664489746, -0.963735044002533, -0.5292624235153198, -0.09478974342346191, 0.33968281745910645, 0.7741553783416748, 1.2086281776428223, 1.6431007385253906, 2.077573299407959, 2.5120458602905273, 2.9465184211730957, 3.380991220474243, 3.8154637813568115, 4.249936103820801, 4.684409141540527, 5.118881702423096, 5.553354263305664, 5.987826824188232, 6.422299385070801, 6.856772422790527, 7.2912445068359375, 7.725717544555664, 8.16019058227539, 8.5946626663208, 9.029134750366211, 9.463607788085938, 9.898079872131348, 10.332552909851074, 10.767024993896484, 11.201498031616211, 11.635971069335938, 12.070443153381348, 12.504916191101074, 12.9393892288208, 13.373861312866211, 13.808334350585938, 14.242806434631348, 14.677279472351074, 15.111751556396484, 15.546224594116211, 15.980697631835938, 16.415170669555664, 16.84964370727539, 17.284114837646484, 17.71858787536621, 18.153060913085938, 18.587533950805664, 19.02200698852539, 19.456478118896484]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 5.0, 3.0, 8.0, 12.0, 13.0, 22.0, 17.0, 19.0, 26.0, 19.0, 19.0, 34.0, 34.0, 40.0, 37.0, 25.0, 41.0, 35.0, 42.0, 27.0, 26.0, 42.0, 38.0, 33.0, 40.0, 38.0, 36.0, 33.0, 16.0, 30.0, 22.0, 28.0, 17.0, 18.0, 10.0, 18.0, 10.0, 9.0, 10.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.363385200500488, -5.187209129333496, -5.011033058166504, -4.834856986999512, -4.658681392669678, -4.4825053215026855, -4.306329250335693, -4.130153179168701, -3.953977108001709, -3.777801036834717, -3.6016252040863037, -3.4254491329193115, -3.2492730617523193, -3.0730972290039062, -2.896921157836914, -2.720745086669922, -2.544569253921509, -2.3683931827545166, -2.1922173500061035, -2.0160412788391113, -1.8398652076721191, -1.6636892557144165, -1.4875133037567139, -1.3113372325897217, -1.135161280632019, -0.9589852690696716, -0.7828092575073242, -0.6066333055496216, -0.43045729398727417, -0.25428128242492676, -0.07810533046722412, 0.09807074069976807, 0.2742466926574707, 0.4504227042198181, 0.6265987157821655, 0.8027746677398682, 0.9789506793022156, 1.155126690864563, 1.3313026428222656, 1.5074787139892578, 1.6836546659469604, 1.859830617904663, 2.0360066890716553, 2.2121825218200684, 2.3883585929870605, 2.5645346641540527, 2.740710735321045, 2.916886806488037, 3.09306263923645, 3.2692387104034424, 3.4454145431518555, 3.6215906143188477, 3.79776668548584, 3.973942756652832, 4.150118827819824, 4.326294898986816, 4.50247049331665, 4.678646564483643, 4.854822635650635, 5.030998229980469, 5.207174301147461, 5.383350372314453, 5.559526443481445, 5.7357025146484375, 5.91187858581543]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 8.0, 15.0, 20.0, 37.0, 59.0, 94.0, 116.0, 206.0, 311.0, 500.0, 721.0, 1234.0, 1834.0, 2821.0, 4301.0, 6617.0, 10311.0, 15708.0, 24291.0, 38163.0, 65009.0, 126281.0, 234239.0, 227729.0, 120356.0, 62901.0, 37511.0, 23491.0, 15132.0, 9985.0, 6582.0, 4190.0, 2789.0, 1768.0, 1148.0, 730.0, 471.0, 315.0, 195.0, 150.0, 68.0, 52.0, 34.0, 20.0, 14.0, 10.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.134033203125, -1.09619140625, -1.058349609375, -1.0205078125, -0.982666015625, -0.94482421875, -0.906982421875, -0.869140625, -0.831298828125, -0.79345703125, -0.755615234375, -0.7177734375, -0.679931640625, -0.64208984375, -0.604248046875, -0.56640625, -0.528564453125, -0.49072265625, -0.452880859375, -0.4150390625, -0.377197265625, -0.33935546875, -0.301513671875, -0.263671875, -0.225830078125, -0.18798828125, -0.150146484375, -0.1123046875, -0.074462890625, -0.03662109375, 0.001220703125, 0.0390625, 0.076904296875, 0.11474609375, 0.152587890625, 0.1904296875, 0.228271484375, 0.26611328125, 0.303955078125, 0.341796875, 0.379638671875, 0.41748046875, 0.455322265625, 0.4931640625, 0.531005859375, 0.56884765625, 0.606689453125, 0.64453125, 0.682373046875, 0.72021484375, 0.758056640625, 0.7958984375, 0.833740234375, 0.87158203125, 0.909423828125, 0.947265625, 0.985107421875, 1.02294921875, 1.060791015625, 1.0986328125, 1.136474609375, 1.17431640625, 1.212158203125, 1.25]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 11.0, 16.0, 9.0, 20.0, 23.0, 29.0, 27.0, 38.0, 35.0, 28.0, 58.0, 50.0, 48.0, 43.0, 47.0, 51.0, 34.0, 47.0, 52.0, 43.0, 36.0, 38.0, 32.0, 31.0, 29.0, 11.0, 16.0, 12.0, 14.0, 11.0, 12.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0517578125, -1.0201187133789062, -0.9884796142578125, -0.9568405151367188, -0.925201416015625, -0.8935623168945312, -0.8619232177734375, -0.8302841186523438, -0.79864501953125, -0.7670059204101562, -0.7353668212890625, -0.7037277221679688, -0.672088623046875, -0.6404495239257812, -0.6088104248046875, -0.5771713256835938, -0.5455322265625, -0.5138931274414062, -0.4822540283203125, -0.45061492919921875, -0.418975830078125, -0.38733673095703125, -0.3556976318359375, -0.32405853271484375, -0.29241943359375, -0.26078033447265625, -0.2291412353515625, -0.19750213623046875, -0.165863037109375, -0.13422393798828125, -0.1025848388671875, -0.07094573974609375, -0.039306640625, -0.00766754150390625, 0.0239715576171875, 0.05561065673828125, 0.087249755859375, 0.11888885498046875, 0.1505279541015625, 0.18216705322265625, 0.21380615234375, 0.24544525146484375, 0.2770843505859375, 0.30872344970703125, 0.340362548828125, 0.37200164794921875, 0.4036407470703125, 0.43527984619140625, 0.4669189453125, 0.49855804443359375, 0.5301971435546875, 0.5618362426757812, 0.593475341796875, 0.6251144409179688, 0.6567535400390625, 0.6883926391601562, 0.72003173828125, 0.7516708374023438, 0.7833099365234375, 0.8149490356445312, 0.846588134765625, 0.8782272338867188, 0.9098663330078125, 0.9415054321289062, 0.97314453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 6.0, 13.0, 11.0, 7.0, 11.0, 22.0, 34.0, 46.0, 76.0, 115.0, 213.0, 499.0, 1183.0, 3483.0, 10612.0, 31860.0, 105588.0, 510672.0, 289170.0, 63590.0, 20399.0, 6853.0, 2375.0, 876.0, 357.0, 152.0, 100.0, 46.0, 49.0, 16.0, 22.0, 15.0, 11.0, 20.0, 8.0, 11.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.40655517578125, -3.2994384765625, -3.19232177734375, -3.085205078125, -2.97808837890625, -2.8709716796875, -2.76385498046875, -2.65673828125, -2.54962158203125, -2.4425048828125, -2.33538818359375, -2.228271484375, -2.12115478515625, -2.0140380859375, -1.90692138671875, -1.7998046875, -1.69268798828125, -1.5855712890625, -1.47845458984375, -1.371337890625, -1.26422119140625, -1.1571044921875, -1.04998779296875, -0.94287109375, -0.83575439453125, -0.7286376953125, -0.62152099609375, -0.514404296875, -0.40728759765625, -0.3001708984375, -0.19305419921875, -0.0859375, 0.02117919921875, 0.1282958984375, 0.23541259765625, 0.342529296875, 0.44964599609375, 0.5567626953125, 0.66387939453125, 0.77099609375, 0.87811279296875, 0.9852294921875, 1.09234619140625, 1.199462890625, 1.30657958984375, 1.4136962890625, 1.52081298828125, 1.6279296875, 1.73504638671875, 1.8421630859375, 1.94927978515625, 2.056396484375, 2.16351318359375, 2.2706298828125, 2.37774658203125, 2.48486328125, 2.59197998046875, 2.6990966796875, 2.80621337890625, 2.913330078125, 3.02044677734375, 3.1275634765625, 3.23468017578125, 3.341796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 2.0, 8.0, 11.0, 7.0, 16.0, 11.0, 11.0, 22.0, 14.0, 22.0, 29.0, 23.0, 35.0, 39.0, 25.0, 46.0, 37.0, 38.0, 48.0, 45.0, 45.0, 49.0, 38.0, 41.0, 40.0, 33.0, 38.0, 26.0, 32.0, 27.0, 21.0, 24.0, 26.0, 15.0, 9.0, 9.0, 13.0, 5.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.267578125, -3.17962646484375, -3.0916748046875, -3.00372314453125, -2.915771484375, -2.82781982421875, -2.7398681640625, -2.65191650390625, -2.56396484375, -2.47601318359375, -2.3880615234375, -2.30010986328125, -2.212158203125, -2.12420654296875, -2.0362548828125, -1.94830322265625, -1.8603515625, -1.77239990234375, -1.6844482421875, -1.59649658203125, -1.508544921875, -1.42059326171875, -1.3326416015625, -1.24468994140625, -1.15673828125, -1.06878662109375, -0.9808349609375, -0.89288330078125, -0.804931640625, -0.71697998046875, -0.6290283203125, -0.54107666015625, -0.453125, -0.36517333984375, -0.2772216796875, -0.18927001953125, -0.101318359375, -0.01336669921875, 0.0745849609375, 0.16253662109375, 0.25048828125, 0.33843994140625, 0.4263916015625, 0.51434326171875, 0.602294921875, 0.69024658203125, 0.7781982421875, 0.86614990234375, 0.9541015625, 1.04205322265625, 1.1300048828125, 1.21795654296875, 1.305908203125, 1.39385986328125, 1.4818115234375, 1.56976318359375, 1.65771484375, 1.74566650390625, 1.8336181640625, 1.92156982421875, 2.009521484375, 2.09747314453125, 2.1854248046875, 2.27337646484375, 2.361328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 14.0, 18.0, 18.0, 20.0, 26.0, 48.0, 64.0, 76.0, 114.0, 192.0, 302.0, 530.0, 853.0, 1431.0, 2591.0, 4442.0, 7370.0, 12482.0, 21847.0, 43741.0, 110473.0, 327728.0, 314876.0, 105882.0, 42130.0, 21433.0, 12162.0, 7279.0, 4240.0, 2466.0, 1401.0, 860.0, 524.0, 304.0, 188.0, 112.0, 91.0, 72.0, 28.0, 36.0, 24.0, 18.0, 6.0, 10.0, 8.0, 4.0, 8.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9875640869140625, -0.954620361328125, -0.9216766357421875, -0.88873291015625, -0.8557891845703125, -0.822845458984375, -0.7899017333984375, -0.7569580078125, -0.7240142822265625, -0.691070556640625, -0.6581268310546875, -0.62518310546875, -0.5922393798828125, -0.559295654296875, -0.5263519287109375, -0.493408203125, -0.4604644775390625, -0.427520751953125, -0.3945770263671875, -0.36163330078125, -0.3286895751953125, -0.295745849609375, -0.2628021240234375, -0.2298583984375, -0.1969146728515625, -0.163970947265625, -0.1310272216796875, -0.09808349609375, -0.0651397705078125, -0.032196044921875, 0.0007476806640625, 0.03369140625, 0.0666351318359375, 0.099578857421875, 0.1325225830078125, 0.16546630859375, 0.1984100341796875, 0.231353759765625, 0.2642974853515625, 0.2972412109375, 0.3301849365234375, 0.363128662109375, 0.3960723876953125, 0.42901611328125, 0.4619598388671875, 0.494903564453125, 0.5278472900390625, 0.560791015625, 0.5937347412109375, 0.626678466796875, 0.6596221923828125, 0.69256591796875, 0.7255096435546875, 0.758453369140625, 0.7913970947265625, 0.8243408203125, 0.8572845458984375, 0.890228271484375, 0.9231719970703125, 0.95611572265625, 0.9890594482421875, 1.022003173828125, 1.0549468994140625, 1.087890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 8.0, 3.0, 5.0, 7.0, 12.0, 18.0, 21.0, 22.0, 37.0, 64.0, 93.0, 143.0, 162.0, 119.0, 81.0, 59.0, 36.0, 25.0, 17.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002486705780029297, -0.00023988261818885803, -0.00023109465837478638, -0.00022230669856071472, -0.00021351873874664307, -0.0002047307789325714, -0.00019594281911849976, -0.0001871548593044281, -0.00017836689949035645, -0.0001695789396762848, -0.00016079097986221313, -0.00015200302004814148, -0.00014321506023406982, -0.00013442710041999817, -0.00012563914060592651, -0.00011685118079185486, -0.0001080632209777832, -9.927526116371155e-05, -9.048730134963989e-05, -8.169934153556824e-05, -7.291138172149658e-05, -6.412342190742493e-05, -5.533546209335327e-05, -4.6547502279281616e-05, -3.775954246520996e-05, -2.8971582651138306e-05, -2.018362283706665e-05, -1.1395663022994995e-05, -2.60770320892334e-06, 6.1802566051483154e-06, 1.496821641921997e-05, 2.3756176233291626e-05, 3.254413604736328e-05, 4.1332095861434937e-05, 5.012005567550659e-05, 5.890801548957825e-05, 6.76959753036499e-05, 7.648393511772156e-05, 8.527189493179321e-05, 9.405985474586487e-05, 0.00010284781455993652, 0.00011163577437400818, 0.00012042373418807983, 0.0001292116940021515, 0.00013799965381622314, 0.0001467876136302948, 0.00015557557344436646, 0.0001643635332584381, 0.00017315149307250977, 0.00018193945288658142, 0.00019072741270065308, 0.00019951537251472473, 0.0002083033323287964, 0.00021709129214286804, 0.0002258792519569397, 0.00023466721177101135, 0.000243455171585083, 0.00025224313139915466, 0.0002610310912132263, 0.000269819051027298, 0.00027860701084136963, 0.0002873949706554413, 0.00029618293046951294, 0.0003049708902835846, 0.00031375885009765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 8.0, 12.0, 22.0, 26.0, 48.0, 68.0, 86.0, 157.0, 285.0, 510.0, 845.0, 1571.0, 2789.0, 4983.0, 9048.0, 16583.0, 32186.0, 72889.0, 204888.0, 402428.0, 172394.0, 63951.0, 29087.0, 15063.0, 8231.0, 4460.0, 2517.0, 1480.0, 806.0, 450.0, 252.0, 154.0, 97.0, 56.0, 34.0, 29.0, 20.0, 15.0, 6.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.916015625, -0.8837890625, -0.8515625, -0.8193359375, -0.787109375, -0.7548828125, -0.72265625, -0.6904296875, -0.658203125, -0.6259765625, -0.59375, -0.5615234375, -0.529296875, -0.4970703125, -0.46484375, -0.4326171875, -0.400390625, -0.3681640625, -0.3359375, -0.3037109375, -0.271484375, -0.2392578125, -0.20703125, -0.1748046875, -0.142578125, -0.1103515625, -0.078125, -0.0458984375, -0.013671875, 0.0185546875, 0.05078125, 0.0830078125, 0.115234375, 0.1474609375, 0.1796875, 0.2119140625, 0.244140625, 0.2763671875, 0.30859375, 0.3408203125, 0.373046875, 0.4052734375, 0.4375, 0.4697265625, 0.501953125, 0.5341796875, 0.56640625, 0.5986328125, 0.630859375, 0.6630859375, 0.6953125, 0.7275390625, 0.759765625, 0.7919921875, 0.82421875, 0.8564453125, 0.888671875, 0.9208984375, 0.953125, 0.9853515625, 1.017578125, 1.0498046875, 1.08203125, 1.1142578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 6.0, 7.0, 13.0, 12.0, 21.0, 28.0, 42.0, 47.0, 96.0, 115.0, 150.0, 129.0, 93.0, 59.0, 46.0, 38.0, 15.0, 17.0, 10.0, 8.0, 7.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.7288665771484375, -1.680389404296875, -1.6319122314453125, -1.58343505859375, -1.5349578857421875, -1.486480712890625, -1.4380035400390625, -1.3895263671875, -1.3410491943359375, -1.292572021484375, -1.2440948486328125, -1.19561767578125, -1.1471405029296875, -1.098663330078125, -1.0501861572265625, -1.001708984375, -0.9532318115234375, -0.904754638671875, -0.8562774658203125, -0.80780029296875, -0.7593231201171875, -0.710845947265625, -0.6623687744140625, -0.6138916015625, -0.5654144287109375, -0.516937255859375, -0.4684600830078125, -0.41998291015625, -0.3715057373046875, -0.323028564453125, -0.2745513916015625, -0.22607421875, -0.1775970458984375, -0.129119873046875, -0.0806427001953125, -0.03216552734375, 0.0163116455078125, 0.064788818359375, 0.1132659912109375, 0.1617431640625, 0.2102203369140625, 0.258697509765625, 0.3071746826171875, 0.35565185546875, 0.4041290283203125, 0.452606201171875, 0.5010833740234375, 0.549560546875, 0.5980377197265625, 0.646514892578125, 0.6949920654296875, 0.74346923828125, 0.7919464111328125, 0.840423583984375, 0.8889007568359375, 0.9373779296875, 0.9858551025390625, 1.034332275390625, 1.0828094482421875, 1.13128662109375, 1.1797637939453125, 1.228240966796875, 1.2767181396484375, 1.3251953125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 35.0, 292.0, 561.0, 122.0, 6.0, 2.0], "bins": [-136.30062866210938, -134.04249572753906, -131.78436279296875, -129.5262451171875, -127.26811218261719, -125.00997924804688, -122.7518539428711, -120.49372863769531, -118.235595703125, -115.97746276855469, -113.7193374633789, -111.46121215820312, -109.20307922363281, -106.9449462890625, -104.68682098388672, -102.42869567871094, -100.17056274414062, -97.91242980957031, -95.65430450439453, -93.39617919921875, -91.13804626464844, -88.87991333007812, -86.62178802490234, -84.36366271972656, -82.10552978515625, -79.84739685058594, -77.58927154541016, -75.33114624023438, -73.07301330566406, -70.81488037109375, -68.55675506591797, -66.29862976074219, -64.04049682617188, -61.78236770629883, -59.52423858642578, -57.266109466552734, -55.00798034667969, -52.74985122680664, -50.491722106933594, -48.23359298706055, -45.975467681884766, -43.71733856201172, -41.45920944213867, -39.201080322265625, -36.94295120239258, -34.68482208251953, -32.426692962646484, -30.168563842773438, -27.91043472290039, -25.652305603027344, -23.394176483154297, -21.13604736328125, -18.877918243408203, -16.619789123535156, -14.36166000366211, -12.103530883789062, -9.845401763916016, -7.587272644042969, -5.329143524169922, -3.071014404296875, -0.8128852844238281, 1.4452438354492188, 3.7033729553222656, 5.9615020751953125, 8.21963119506836]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 6.0, 6.0, 4.0, 3.0, 10.0, 11.0, 7.0, 13.0, 15.0, 13.0, 23.0, 19.0, 34.0, 38.0, 34.0, 41.0, 43.0, 35.0, 57.0, 45.0, 50.0, 47.0, 41.0, 40.0, 40.0, 42.0, 44.0, 25.0, 32.0, 30.0, 33.0, 24.0, 12.0, 19.0, 11.0, 13.0, 7.0, 4.0, 6.0, 3.0, 10.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796760559082031, -8.49354362487793, -8.190325736999512, -7.88710880279541, -7.58389139175415, -7.280673980712891, -6.977457046508789, -6.674239635467529, -6.3710222244262695, -6.06780481338501, -5.76458740234375, -5.461370468139648, -5.158153057098389, -4.854935646057129, -4.551718711853027, -4.248501300811768, -3.945283889770508, -3.642066478729248, -3.3388493061065674, -3.0356321334838867, -2.732414722442627, -2.429197311401367, -2.1259801387786865, -1.8227629661560059, -1.519545555114746, -1.2163282632827759, -0.9131109714508057, -0.6098936796188354, -0.30667638778686523, -0.0034590959548950195, 0.2997581958770752, 0.6029753684997559, 0.9061927795410156, 1.2094100713729858, 1.512627363204956, 1.8158446550369263, 2.1190619468688965, 2.4222793579101562, 2.725496530532837, 3.0287137031555176, 3.3319311141967773, 3.635148525238037, 3.9383656978607178, 4.241582870483398, 4.544800281524658, 4.848017692565918, 5.1512346267700195, 5.454452037811279, 5.757669448852539, 6.060886859893799, 6.364104270935059, 6.66732120513916, 6.97053861618042, 7.27375602722168, 7.576972961425781, 7.880190372467041, 8.1834077835083, 8.486624717712402, 8.78984260559082, 9.093059539794922, 9.396276473999023, 9.699494361877441, 10.002711296081543, 10.305929183959961, 10.609146118164062]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 16.0, 9.0, 22.0, 16.0, 25.0, 35.0, 44.0, 58.0, 95.0, 142.0, 208.0, 341.0, 487.0, 846.0, 1272.0, 2099.0, 3503.0, 6153.0, 10807.0, 20095.0, 37815.0, 74923.0, 158507.0, 377364.0, 1364563.0, 1430068.0, 380894.0, 161200.0, 76448.0, 38372.0, 20544.0, 11361.0, 6391.0, 3680.0, 2206.0, 1323.0, 808.0, 508.0, 294.0, 205.0, 158.0, 113.0, 81.0, 62.0, 30.0, 23.0, 22.0, 16.0, 12.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.2119140625, -1.1740570068359375, -1.136199951171875, -1.0983428955078125, -1.06048583984375, -1.0226287841796875, -0.984771728515625, -0.9469146728515625, -0.9090576171875, -0.8712005615234375, -0.833343505859375, -0.7954864501953125, -0.75762939453125, -0.7197723388671875, -0.681915283203125, -0.6440582275390625, -0.606201171875, -0.5683441162109375, -0.530487060546875, -0.4926300048828125, -0.45477294921875, -0.4169158935546875, -0.379058837890625, -0.3412017822265625, -0.3033447265625, -0.2654876708984375, -0.227630615234375, -0.1897735595703125, -0.15191650390625, -0.1140594482421875, -0.076202392578125, -0.0383453369140625, -0.00048828125, 0.0373687744140625, 0.075225830078125, 0.1130828857421875, 0.15093994140625, 0.1887969970703125, 0.226654052734375, 0.2645111083984375, 0.3023681640625, 0.3402252197265625, 0.378082275390625, 0.4159393310546875, 0.45379638671875, 0.4916534423828125, 0.529510498046875, 0.5673675537109375, 0.605224609375, 0.6430816650390625, 0.680938720703125, 0.7187957763671875, 0.75665283203125, 0.7945098876953125, 0.832366943359375, 0.8702239990234375, 0.9080810546875, 0.9459381103515625, 0.983795166015625, 1.0216522216796875, 1.05950927734375, 1.0973663330078125, 1.135223388671875, 1.1730804443359375, 1.2109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 9.0, 1.0, 3.0, 14.0, 14.0, 6.0, 15.0, 14.0, 17.0, 25.0, 26.0, 26.0, 27.0, 34.0, 37.0, 55.0, 53.0, 52.0, 37.0, 45.0, 35.0, 43.0, 50.0, 33.0, 31.0, 34.0, 29.0, 32.0, 31.0, 23.0, 25.0, 18.0, 13.0, 18.0, 11.0, 10.0, 6.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.98486328125, -0.9564208984375, -0.927978515625, -0.8995361328125, -0.87109375, -0.8426513671875, -0.814208984375, -0.7857666015625, -0.75732421875, -0.7288818359375, -0.700439453125, -0.6719970703125, -0.6435546875, -0.6151123046875, -0.586669921875, -0.5582275390625, -0.52978515625, -0.5013427734375, -0.472900390625, -0.4444580078125, -0.416015625, -0.3875732421875, -0.359130859375, -0.3306884765625, -0.30224609375, -0.2738037109375, -0.245361328125, -0.2169189453125, -0.1884765625, -0.1600341796875, -0.131591796875, -0.1031494140625, -0.07470703125, -0.0462646484375, -0.017822265625, 0.0106201171875, 0.0390625, 0.0675048828125, 0.095947265625, 0.1243896484375, 0.15283203125, 0.1812744140625, 0.209716796875, 0.2381591796875, 0.2666015625, 0.2950439453125, 0.323486328125, 0.3519287109375, 0.38037109375, 0.4088134765625, 0.437255859375, 0.4656982421875, 0.494140625, 0.5225830078125, 0.551025390625, 0.5794677734375, 0.60791015625, 0.6363525390625, 0.664794921875, 0.6932373046875, 0.7216796875, 0.7501220703125, 0.778564453125, 0.8070068359375, 0.83544921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 5.0, 6.0, 8.0, 9.0, 11.0, 8.0, 20.0, 20.0, 27.0, 38.0, 50.0, 79.0, 120.0, 259.0, 618.0, 1524.0, 5149.0, 26828.0, 229210.0, 3078198.0, 770826.0, 66470.0, 10455.0, 2567.0, 935.0, 337.0, 163.0, 96.0, 50.0, 45.0, 22.0, 20.0, 11.0, 18.0, 21.0, 6.0, 9.0, 9.0, 7.0, 4.0, 5.0, 0.0, 1.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9140625, -5.7276611328125, -5.541259765625, -5.3548583984375, -5.16845703125, -4.9820556640625, -4.795654296875, -4.6092529296875, -4.4228515625, -4.2364501953125, -4.050048828125, -3.8636474609375, -3.67724609375, -3.4908447265625, -3.304443359375, -3.1180419921875, -2.931640625, -2.7452392578125, -2.558837890625, -2.3724365234375, -2.18603515625, -1.9996337890625, -1.813232421875, -1.6268310546875, -1.4404296875, -1.2540283203125, -1.067626953125, -0.8812255859375, -0.69482421875, -0.5084228515625, -0.322021484375, -0.1356201171875, 0.05078125, 0.2371826171875, 0.423583984375, 0.6099853515625, 0.79638671875, 0.9827880859375, 1.169189453125, 1.3555908203125, 1.5419921875, 1.7283935546875, 1.914794921875, 2.1011962890625, 2.28759765625, 2.4739990234375, 2.660400390625, 2.8468017578125, 3.033203125, 3.2196044921875, 3.406005859375, 3.5924072265625, 3.77880859375, 3.9652099609375, 4.151611328125, 4.3380126953125, 4.5244140625, 4.7108154296875, 4.897216796875, 5.0836181640625, 5.27001953125, 5.4564208984375, 5.642822265625, 5.8292236328125, 6.015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 10.0, 33.0, 68.0, 112.0, 236.0, 489.0, 1284.0, 912.0, 452.0, 226.0, 130.0, 55.0, 32.0, 22.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7763671875, -6.634765625, -6.4931640625, -6.3515625, -6.2099609375, -6.068359375, -5.9267578125, -5.78515625, -5.6435546875, -5.501953125, -5.3603515625, -5.21875, -5.0771484375, -4.935546875, -4.7939453125, -4.65234375, -4.5107421875, -4.369140625, -4.2275390625, -4.0859375, -3.9443359375, -3.802734375, -3.6611328125, -3.51953125, -3.3779296875, -3.236328125, -3.0947265625, -2.953125, -2.8115234375, -2.669921875, -2.5283203125, -2.38671875, -2.2451171875, -2.103515625, -1.9619140625, -1.8203125, -1.6787109375, -1.537109375, -1.3955078125, -1.25390625, -1.1123046875, -0.970703125, -0.8291015625, -0.6875, -0.5458984375, -0.404296875, -0.2626953125, -0.12109375, 0.0205078125, 0.162109375, 0.3037109375, 0.4453125, 0.5869140625, 0.728515625, 0.8701171875, 1.01171875, 1.1533203125, 1.294921875, 1.4365234375, 1.578125, 1.7197265625, 1.861328125, 2.0029296875, 2.14453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 0.0, 8.0, 13.0, 16.0, 30.0, 43.0, 55.0, 88.0, 95.0, 114.0, 118.0, 89.0, 87.0, 63.0, 62.0, 40.0, 27.0, 17.0, 21.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.139472961425781, -5.714046001434326, -5.288619518280029, -4.863192558288574, -4.437766075134277, -4.012339115142822, -3.5869123935699463, -3.1614856719970703, -2.7360589504241943, -2.3106322288513184, -1.8852055072784424, -1.4597786664962769, -1.0343519449234009, -0.6089251041412354, -0.18349838256835938, 0.2419283390045166, 0.6673550605773926, 1.0927817821502686, 1.5182085037231445, 1.94363534450531, 2.3690619468688965, 2.7944889068603516, 3.2199156284332275, 3.6453423500061035, 4.070769309997559, 4.496196269989014, 4.9216227531433105, 5.347049713134766, 5.7724761962890625, 6.197903156280518, 6.623330116271973, 7.0487565994262695, 7.474183082580566, 7.8996100425720215, 8.325037002563477, 8.750463485717773, 9.17588996887207, 9.601316452026367, 10.02674388885498, 10.452170372009277, 10.877596855163574, 11.303023338317871, 11.728450775146484, 12.153877258300781, 12.579303741455078, 13.004730224609375, 13.430157661437988, 13.855584144592285, 14.281011581420898, 14.706438064575195, 15.131865501403809, 15.557291984558105, 15.982718467712402, 16.408145904541016, 16.833572387695312, 17.25899887084961, 17.684425354003906, 18.109851837158203, 18.5352783203125, 18.960704803466797, 19.386133193969727, 19.811559677124023, 20.23698616027832, 20.662412643432617, 21.087839126586914]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 8.0, 15.0, 18.0, 13.0, 14.0, 12.0, 26.0, 32.0, 29.0, 16.0, 36.0, 45.0, 29.0, 33.0, 50.0, 38.0, 48.0, 36.0, 33.0, 36.0, 28.0, 27.0, 36.0, 29.0, 28.0, 22.0, 18.0, 23.0, 22.0, 23.0, 14.0, 16.0, 16.0, 15.0, 14.0, 13.0, 9.0, 4.0, 6.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0], "bins": [-6.529906272888184, -6.333456039428711, -6.137005805969238, -5.940556049346924, -5.744105815887451, -5.5476555824279785, -5.351205825805664, -5.154755592346191, -4.958305358886719, -4.761855125427246, -4.565404891967773, -4.368955135345459, -4.172504901885986, -3.9760546684265137, -3.77960467338562, -3.5831546783447266, -3.386704444885254, -3.1902542114257812, -2.9938042163848877, -2.797354221343994, -2.6009039878845215, -2.404453754425049, -2.2080037593841553, -2.0115537643432617, -1.815103530883789, -1.618653416633606, -1.4222033023834229, -1.2257531881332397, -1.0293030738830566, -0.8328529596328735, -0.6364028453826904, -0.4399527311325073, -0.24350214004516602, -0.04705202579498291, 0.1493980884552002, 0.3458482027053833, 0.5422983169555664, 0.7387484312057495, 0.9351985454559326, 1.1316486597061157, 1.3280987739562988, 1.524548888206482, 1.720999002456665, 1.9174491167068481, 2.1138992309570312, 2.310349464416504, 2.5067994594573975, 2.703249454498291, 2.8996996879577637, 3.0961499214172363, 3.29259991645813, 3.4890499114990234, 3.685500144958496, 3.8819503784179688, 4.078400611877441, 4.274850368499756, 4.4713006019592285, 4.667750835418701, 4.864200592041016, 5.060650825500488, 5.257101058959961, 5.453551292419434, 5.650001525878906, 5.846451282501221, 6.042901515960693]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 17.0, 19.0, 33.0, 57.0, 102.0, 130.0, 190.0, 302.0, 402.0, 669.0, 985.0, 1468.0, 2305.0, 3414.0, 5241.0, 8282.0, 12982.0, 20629.0, 34605.0, 62382.0, 119319.0, 211202.0, 233551.0, 146800.0, 76003.0, 41343.0, 24060.0, 14887.0, 9589.0, 6146.0, 3970.0, 2625.0, 1638.0, 1038.0, 726.0, 487.0, 303.0, 201.0, 155.0, 99.0, 57.0, 51.0, 25.0, 15.0, 10.0, 5.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2294921875, -1.188720703125, -1.14794921875, -1.107177734375, -1.06640625, -1.025634765625, -0.98486328125, -0.944091796875, -0.9033203125, -0.862548828125, -0.82177734375, -0.781005859375, -0.740234375, -0.699462890625, -0.65869140625, -0.617919921875, -0.5771484375, -0.536376953125, -0.49560546875, -0.454833984375, -0.4140625, -0.373291015625, -0.33251953125, -0.291748046875, -0.2509765625, -0.210205078125, -0.16943359375, -0.128662109375, -0.087890625, -0.047119140625, -0.00634765625, 0.034423828125, 0.0751953125, 0.115966796875, 0.15673828125, 0.197509765625, 0.23828125, 0.279052734375, 0.31982421875, 0.360595703125, 0.4013671875, 0.442138671875, 0.48291015625, 0.523681640625, 0.564453125, 0.605224609375, 0.64599609375, 0.686767578125, 0.7275390625, 0.768310546875, 0.80908203125, 0.849853515625, 0.890625, 0.931396484375, 0.97216796875, 1.012939453125, 1.0537109375, 1.094482421875, 1.13525390625, 1.176025390625, 1.216796875, 1.257568359375, 1.29833984375, 1.339111328125, 1.3798828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 11.0, 11.0, 15.0, 17.0, 13.0, 19.0, 16.0, 26.0, 35.0, 37.0, 43.0, 42.0, 41.0, 56.0, 46.0, 40.0, 47.0, 45.0, 48.0, 43.0, 34.0, 36.0, 44.0, 25.0, 28.0, 26.0, 27.0, 14.0, 16.0, 17.0, 14.0, 10.0, 7.0, 8.0, 4.0, 12.0, 3.0, 5.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.267578125, -1.23101806640625, -1.1944580078125, -1.15789794921875, -1.121337890625, -1.08477783203125, -1.0482177734375, -1.01165771484375, -0.97509765625, -0.93853759765625, -0.9019775390625, -0.86541748046875, -0.828857421875, -0.79229736328125, -0.7557373046875, -0.71917724609375, -0.6826171875, -0.64605712890625, -0.6094970703125, -0.57293701171875, -0.536376953125, -0.49981689453125, -0.4632568359375, -0.42669677734375, -0.39013671875, -0.35357666015625, -0.3170166015625, -0.28045654296875, -0.243896484375, -0.20733642578125, -0.1707763671875, -0.13421630859375, -0.09765625, -0.06109619140625, -0.0245361328125, 0.01202392578125, 0.048583984375, 0.08514404296875, 0.1217041015625, 0.15826416015625, 0.19482421875, 0.23138427734375, 0.2679443359375, 0.30450439453125, 0.341064453125, 0.37762451171875, 0.4141845703125, 0.45074462890625, 0.4873046875, 0.52386474609375, 0.5604248046875, 0.59698486328125, 0.633544921875, 0.67010498046875, 0.7066650390625, 0.74322509765625, 0.77978515625, 0.81634521484375, 0.8529052734375, 0.88946533203125, 0.926025390625, 0.96258544921875, 0.9991455078125, 1.03570556640625, 1.072265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 14.0, 13.0, 13.0, 13.0, 26.0, 23.0, 37.0, 61.0, 107.0, 261.0, 625.0, 1753.0, 5108.0, 18257.0, 80114.0, 519118.0, 350411.0, 53164.0, 13235.0, 3896.0, 1343.0, 463.0, 179.0, 94.0, 51.0, 28.0, 18.0, 23.0, 23.0, 14.0, 7.0, 7.0, 9.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.20684814453125, -4.0660400390625, -3.92523193359375, -3.784423828125, -3.64361572265625, -3.5028076171875, -3.36199951171875, -3.22119140625, -3.08038330078125, -2.9395751953125, -2.79876708984375, -2.657958984375, -2.51715087890625, -2.3763427734375, -2.23553466796875, -2.0947265625, -1.95391845703125, -1.8131103515625, -1.67230224609375, -1.531494140625, -1.39068603515625, -1.2498779296875, -1.10906982421875, -0.96826171875, -0.82745361328125, -0.6866455078125, -0.54583740234375, -0.405029296875, -0.26422119140625, -0.1234130859375, 0.01739501953125, 0.158203125, 0.29901123046875, 0.4398193359375, 0.58062744140625, 0.721435546875, 0.86224365234375, 1.0030517578125, 1.14385986328125, 1.28466796875, 1.42547607421875, 1.5662841796875, 1.70709228515625, 1.847900390625, 1.98870849609375, 2.1295166015625, 2.27032470703125, 2.4111328125, 2.55194091796875, 2.6927490234375, 2.83355712890625, 2.974365234375, 3.11517333984375, 3.2559814453125, 3.39678955078125, 3.53759765625, 3.67840576171875, 3.8192138671875, 3.96002197265625, 4.100830078125, 4.24163818359375, 4.3824462890625, 4.52325439453125, 4.6640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 12.0, 12.0, 21.0, 22.0, 20.0, 33.0, 31.0, 35.0, 45.0, 49.0, 42.0, 41.0, 56.0, 55.0, 42.0, 48.0, 43.0, 49.0, 50.0, 48.0, 37.0, 29.0, 27.0, 21.0, 22.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 6.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.724609375, -3.6060791015625, -3.487548828125, -3.3690185546875, -3.25048828125, -3.1319580078125, -3.013427734375, -2.8948974609375, -2.7763671875, -2.6578369140625, -2.539306640625, -2.4207763671875, -2.30224609375, -2.1837158203125, -2.065185546875, -1.9466552734375, -1.828125, -1.7095947265625, -1.591064453125, -1.4725341796875, -1.35400390625, -1.2354736328125, -1.116943359375, -0.9984130859375, -0.8798828125, -0.7613525390625, -0.642822265625, -0.5242919921875, -0.40576171875, -0.2872314453125, -0.168701171875, -0.0501708984375, 0.068359375, 0.1868896484375, 0.305419921875, 0.4239501953125, 0.54248046875, 0.6610107421875, 0.779541015625, 0.8980712890625, 1.0166015625, 1.1351318359375, 1.253662109375, 1.3721923828125, 1.49072265625, 1.6092529296875, 1.727783203125, 1.8463134765625, 1.96484375, 2.0833740234375, 2.201904296875, 2.3204345703125, 2.43896484375, 2.5574951171875, 2.676025390625, 2.7945556640625, 2.9130859375, 3.0316162109375, 3.150146484375, 3.2686767578125, 3.38720703125, 3.5057373046875, 3.624267578125, 3.7427978515625, 3.861328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 12.0, 8.0, 10.0, 17.0, 33.0, 26.0, 32.0, 54.0, 71.0, 94.0, 136.0, 206.0, 318.0, 491.0, 779.0, 1464.0, 3167.0, 7598.0, 21761.0, 67224.0, 274058.0, 488721.0, 123806.0, 36410.0, 12399.0, 4655.0, 2134.0, 1026.0, 590.0, 387.0, 231.0, 174.0, 130.0, 89.0, 62.0, 49.0, 29.0, 23.0, 21.0, 11.0, 15.0, 8.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7216796875, -1.66656494140625, -1.6114501953125, -1.55633544921875, -1.501220703125, -1.44610595703125, -1.3909912109375, -1.33587646484375, -1.28076171875, -1.22564697265625, -1.1705322265625, -1.11541748046875, -1.060302734375, -1.00518798828125, -0.9500732421875, -0.89495849609375, -0.83984375, -0.78472900390625, -0.7296142578125, -0.67449951171875, -0.619384765625, -0.56427001953125, -0.5091552734375, -0.45404052734375, -0.39892578125, -0.34381103515625, -0.2886962890625, -0.23358154296875, -0.178466796875, -0.12335205078125, -0.0682373046875, -0.01312255859375, 0.0419921875, 0.09710693359375, 0.1522216796875, 0.20733642578125, 0.262451171875, 0.31756591796875, 0.3726806640625, 0.42779541015625, 0.48291015625, 0.53802490234375, 0.5931396484375, 0.64825439453125, 0.703369140625, 0.75848388671875, 0.8135986328125, 0.86871337890625, 0.923828125, 0.97894287109375, 1.0340576171875, 1.08917236328125, 1.144287109375, 1.19940185546875, 1.2545166015625, 1.30963134765625, 1.36474609375, 1.41986083984375, 1.4749755859375, 1.53009033203125, 1.585205078125, 1.64031982421875, 1.6954345703125, 1.75054931640625, 1.8056640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 5.0, 5.0, 12.0, 12.0, 8.0, 23.0, 35.0, 27.0, 64.0, 118.0, 188.0, 171.0, 119.0, 78.0, 38.0, 35.0, 22.0, 16.0, 8.0, 10.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0005817413330078125, -0.0005691144615411758, -0.0005564875900745392, -0.0005438607186079025, -0.0005312338471412659, -0.0005186069756746292, -0.0005059801042079926, -0.0004933532327413559, -0.00048072636127471924, -0.0004680994898080826, -0.0004554726183414459, -0.00044284574687480927, -0.0004302188754081726, -0.00041759200394153595, -0.0004049651324748993, -0.00039233826100826263, -0.000379711389541626, -0.0003670845180749893, -0.00035445764660835266, -0.000341830775141716, -0.00032920390367507935, -0.0003165770322084427, -0.00030395016074180603, -0.00029132328927516937, -0.0002786964178085327, -0.00026606954634189606, -0.0002534426748752594, -0.00024081580340862274, -0.00022818893194198608, -0.00021556206047534943, -0.00020293518900871277, -0.0001903083175420761, -0.00017768144607543945, -0.0001650545746088028, -0.00015242770314216614, -0.00013980083167552948, -0.00012717396020889282, -0.00011454708874225616, -0.00010192021727561951, -8.929334580898285e-05, -7.666647434234619e-05, -6.403960287570953e-05, -5.1412731409072876e-05, -3.878585994243622e-05, -2.615898847579956e-05, -1.3532117009162903e-05, -9.052455425262451e-07, 1.1721625924110413e-05, 2.434849739074707e-05, 3.697536885738373e-05, 4.9602240324020386e-05, 6.222911179065704e-05, 7.48559832572937e-05, 8.748285472393036e-05, 0.00010010972619056702, 0.00011273659765720367, 0.00012536346912384033, 0.000137990340590477, 0.00015061721205711365, 0.0001632440835237503, 0.00017587095499038696, 0.00018849782645702362, 0.00020112469792366028, 0.00021375156939029694, 0.0002263784408569336]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 8.0, 11.0, 9.0, 12.0, 17.0, 23.0, 32.0, 43.0, 89.0, 82.0, 122.0, 218.0, 362.0, 626.0, 1098.0, 2084.0, 4228.0, 9330.0, 22092.0, 56180.0, 167631.0, 450709.0, 216636.0, 68792.0, 26621.0, 11105.0, 4917.0, 2408.0, 1251.0, 644.0, 380.0, 248.0, 159.0, 116.0, 72.0, 50.0, 34.0, 23.0, 23.0, 15.0, 16.0, 12.0, 4.0, 6.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3125, -1.2696075439453125, -1.226715087890625, -1.1838226318359375, -1.14093017578125, -1.0980377197265625, -1.055145263671875, -1.0122528076171875, -0.9693603515625, -0.9264678955078125, -0.883575439453125, -0.8406829833984375, -0.79779052734375, -0.7548980712890625, -0.712005615234375, -0.6691131591796875, -0.626220703125, -0.5833282470703125, -0.540435791015625, -0.4975433349609375, -0.45465087890625, -0.4117584228515625, -0.368865966796875, -0.3259735107421875, -0.2830810546875, -0.2401885986328125, -0.197296142578125, -0.1544036865234375, -0.11151123046875, -0.0686187744140625, -0.025726318359375, 0.0171661376953125, 0.06005859375, 0.1029510498046875, 0.145843505859375, 0.1887359619140625, 0.23162841796875, 0.2745208740234375, 0.317413330078125, 0.3603057861328125, 0.4031982421875, 0.4460906982421875, 0.488983154296875, 0.5318756103515625, 0.57476806640625, 0.6176605224609375, 0.660552978515625, 0.7034454345703125, 0.746337890625, 0.7892303466796875, 0.832122802734375, 0.8750152587890625, 0.91790771484375, 0.9608001708984375, 1.003692626953125, 1.0465850830078125, 1.0894775390625, 1.1323699951171875, 1.175262451171875, 1.2181549072265625, 1.26104736328125, 1.3039398193359375, 1.346832275390625, 1.3897247314453125, 1.4326171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 2.0, 8.0, 9.0, 11.0, 17.0, 13.0, 28.0, 20.0, 38.0, 39.0, 67.0, 84.0, 105.0, 108.0, 106.0, 88.0, 50.0, 44.0, 35.0, 29.0, 19.0, 15.0, 8.0, 11.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.2639007568359375, -1.225067138671875, -1.1862335205078125, -1.14739990234375, -1.1085662841796875, -1.069732666015625, -1.0308990478515625, -0.9920654296875, -0.9532318115234375, -0.914398193359375, -0.8755645751953125, -0.83673095703125, -0.7978973388671875, -0.759063720703125, -0.7202301025390625, -0.681396484375, -0.6425628662109375, -0.603729248046875, -0.5648956298828125, -0.52606201171875, -0.4872283935546875, -0.448394775390625, -0.4095611572265625, -0.3707275390625, -0.3318939208984375, -0.293060302734375, -0.2542266845703125, -0.21539306640625, -0.1765594482421875, -0.137725830078125, -0.0988922119140625, -0.06005859375, -0.0212249755859375, 0.017608642578125, 0.0564422607421875, 0.09527587890625, 0.1341094970703125, 0.172943115234375, 0.2117767333984375, 0.2506103515625, 0.2894439697265625, 0.328277587890625, 0.3671112060546875, 0.40594482421875, 0.4447784423828125, 0.483612060546875, 0.5224456787109375, 0.561279296875, 0.6001129150390625, 0.638946533203125, 0.6777801513671875, 0.71661376953125, 0.7554473876953125, 0.794281005859375, 0.8331146240234375, 0.8719482421875, 0.9107818603515625, 0.949615478515625, 0.9884490966796875, 1.02728271484375, 1.0661163330078125, 1.104949951171875, 1.1437835693359375, 1.1826171875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 18.0, 34.0, 55.0, 97.0, 103.0, 142.0, 153.0, 135.0, 94.0, 72.0, 41.0, 30.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.198183059692383, -18.63956642150879, -18.080949783325195, -17.5223331451416, -16.963716506958008, -16.405101776123047, -15.846484184265137, -15.287867546081543, -14.729251861572266, -14.170635223388672, -13.612018585205078, -13.053401947021484, -12.494786262512207, -11.936169624328613, -11.37755298614502, -10.818936347961426, -10.260319709777832, -9.701703071594238, -9.143086433410645, -8.584470748901367, -8.025854110717773, -7.46723747253418, -6.908620834350586, -6.350004196166992, -5.791388034820557, -5.232771396636963, -4.674155235290527, -4.115538597106934, -3.556922197341919, -2.9983057975769043, -2.4396891593933105, -1.881072759628296, -1.3224563598632812, -0.7638399004936218, -0.2052234411239624, 0.3533930778503418, 0.9120094776153564, 1.470625877380371, 2.029242515563965, 2.5878589153289795, 3.146475315093994, 3.705091714859009, 4.263708114624023, 4.822324752807617, 5.380941390991211, 5.9395575523376465, 6.49817419052124, 7.056790351867676, 7.6154069900512695, 8.174023628234863, 8.732640266418457, 9.291255950927734, 9.849872589111328, 10.408489227294922, 10.967105865478516, 11.52572250366211, 12.084339141845703, 12.642955780029297, 13.20157241821289, 13.760189056396484, 14.318804740905762, 14.877421379089355, 15.43603801727295, 15.994654655456543, 16.55327033996582]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 8.0, 9.0, 8.0, 8.0, 10.0, 19.0, 18.0, 22.0, 22.0, 27.0, 30.0, 41.0, 26.0, 32.0, 36.0, 50.0, 37.0, 39.0, 32.0, 40.0, 42.0, 38.0, 33.0, 42.0, 25.0, 28.0, 33.0, 27.0, 28.0, 26.0, 26.0, 15.0, 16.0, 15.0, 10.0, 17.0, 7.0, 6.0, 12.0, 10.0, 6.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.37156867980957, -9.097650527954102, -8.823732376098633, -8.54981517791748, -8.275897026062012, -8.001978874206543, -7.728060722351074, -7.4541425704956055, -7.180224895477295, -6.906306743621826, -6.632389068603516, -6.358470916748047, -6.084552764892578, -5.810635089874268, -5.536716938018799, -5.262799263000488, -4.9888811111450195, -4.714962959289551, -4.44104528427124, -4.1671271324157715, -3.893209218978882, -3.619291305541992, -3.3453731536865234, -3.071455240249634, -2.797537326812744, -2.5236194133758545, -2.249701499938965, -1.975783348083496, -1.7018654346466064, -1.4279475212097168, -1.1540294885635376, -0.8801114559173584, -0.6061944961547852, -0.33227652311325073, -0.05835855007171631, 0.21555942296981812, 0.48947739601135254, 0.7633953094482422, 1.0373133420944214, 1.3112313747406006, 1.5851492881774902, 1.8590672016143799, 2.1329851150512695, 2.4069032669067383, 2.680821180343628, 2.9547390937805176, 3.2286572456359863, 3.502575159072876, 3.7764930725097656, 4.050411224365234, 4.324328899383545, 4.598247051239014, 4.872164726257324, 5.146082878112793, 5.420001029968262, 5.6939191818237305, 5.967836856842041, 6.24175500869751, 6.51567268371582, 6.789590835571289, 7.063508987426758, 7.337426662445068, 7.611344814300537, 7.885262489318848, 8.159180641174316]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 12.0, 18.0, 25.0, 26.0, 51.0, 70.0, 101.0, 169.0, 314.0, 486.0, 818.0, 1404.0, 2627.0, 5059.0, 10714.0, 23999.0, 59414.0, 170632.0, 645969.0, 2336788.0, 654909.0, 174114.0, 60732.0, 24413.0, 10536.0, 4957.0, 2518.0, 1422.0, 747.0, 461.0, 271.0, 165.0, 101.0, 57.0, 40.0, 33.0, 20.0, 20.0, 12.0, 11.0, 7.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.322265625, -2.250823974609375, -2.17938232421875, -2.107940673828125, -2.0364990234375, -1.965057373046875, -1.89361572265625, -1.822174072265625, -1.750732421875, -1.679290771484375, -1.60784912109375, -1.536407470703125, -1.4649658203125, -1.393524169921875, -1.32208251953125, -1.250640869140625, -1.17919921875, -1.107757568359375, -1.03631591796875, -0.964874267578125, -0.8934326171875, -0.821990966796875, -0.75054931640625, -0.679107666015625, -0.607666015625, -0.536224365234375, -0.46478271484375, -0.393341064453125, -0.3218994140625, -0.250457763671875, -0.17901611328125, -0.107574462890625, -0.0361328125, 0.035308837890625, 0.10675048828125, 0.178192138671875, 0.2496337890625, 0.321075439453125, 0.39251708984375, 0.463958740234375, 0.535400390625, 0.606842041015625, 0.67828369140625, 0.749725341796875, 0.8211669921875, 0.892608642578125, 0.96405029296875, 1.035491943359375, 1.10693359375, 1.178375244140625, 1.24981689453125, 1.321258544921875, 1.3927001953125, 1.464141845703125, 1.53558349609375, 1.607025146484375, 1.678466796875, 1.749908447265625, 1.82135009765625, 1.892791748046875, 1.9642333984375, 2.035675048828125, 2.10711669921875, 2.178558349609375, 2.25]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 2.0, 3.0, 8.0, 14.0, 9.0, 12.0, 17.0, 17.0, 18.0, 32.0, 34.0, 31.0, 28.0, 35.0, 40.0, 36.0, 43.0, 42.0, 34.0, 48.0, 43.0, 51.0, 35.0, 46.0, 39.0, 35.0, 34.0, 33.0, 37.0, 23.0, 23.0, 15.0, 20.0, 17.0, 8.0, 5.0, 5.0, 5.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1904296875, -1.1539306640625, -1.117431640625, -1.0809326171875, -1.04443359375, -1.0079345703125, -0.971435546875, -0.9349365234375, -0.8984375, -0.8619384765625, -0.825439453125, -0.7889404296875, -0.75244140625, -0.7159423828125, -0.679443359375, -0.6429443359375, -0.6064453125, -0.5699462890625, -0.533447265625, -0.4969482421875, -0.46044921875, -0.4239501953125, -0.387451171875, -0.3509521484375, -0.314453125, -0.2779541015625, -0.241455078125, -0.2049560546875, -0.16845703125, -0.1319580078125, -0.095458984375, -0.0589599609375, -0.0224609375, 0.0140380859375, 0.050537109375, 0.0870361328125, 0.12353515625, 0.1600341796875, 0.196533203125, 0.2330322265625, 0.26953125, 0.3060302734375, 0.342529296875, 0.3790283203125, 0.41552734375, 0.4520263671875, 0.488525390625, 0.5250244140625, 0.5615234375, 0.5980224609375, 0.634521484375, 0.6710205078125, 0.70751953125, 0.7440185546875, 0.780517578125, 0.8170166015625, 0.853515625, 0.8900146484375, 0.926513671875, 0.9630126953125, 0.99951171875, 1.0360107421875, 1.072509765625, 1.1090087890625, 1.1455078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 8.0, 16.0, 17.0, 15.0, 28.0, 39.0, 42.0, 55.0, 77.0, 127.0, 182.0, 264.0, 485.0, 851.0, 1714.0, 3660.0, 8697.0, 24233.0, 80693.0, 355768.0, 2442464.0, 1029633.0, 173500.0, 45314.0, 14942.0, 5832.0, 2585.0, 1243.0, 663.0, 368.0, 233.0, 164.0, 111.0, 64.0, 61.0, 31.0, 27.0, 16.0, 17.0, 10.0, 8.0, 8.0, 5.0, 3.0, 1.0, 4.0, 5.0, 1.0], "bins": [-4.875, -4.742431640625, -4.60986328125, -4.477294921875, -4.3447265625, -4.212158203125, -4.07958984375, -3.947021484375, -3.814453125, -3.681884765625, -3.54931640625, -3.416748046875, -3.2841796875, -3.151611328125, -3.01904296875, -2.886474609375, -2.75390625, -2.621337890625, -2.48876953125, -2.356201171875, -2.2236328125, -2.091064453125, -1.95849609375, -1.825927734375, -1.693359375, -1.560791015625, -1.42822265625, -1.295654296875, -1.1630859375, -1.030517578125, -0.89794921875, -0.765380859375, -0.6328125, -0.500244140625, -0.36767578125, -0.235107421875, -0.1025390625, 0.030029296875, 0.16259765625, 0.295166015625, 0.427734375, 0.560302734375, 0.69287109375, 0.825439453125, 0.9580078125, 1.090576171875, 1.22314453125, 1.355712890625, 1.48828125, 1.620849609375, 1.75341796875, 1.885986328125, 2.0185546875, 2.151123046875, 2.28369140625, 2.416259765625, 2.548828125, 2.681396484375, 2.81396484375, 2.946533203125, 3.0791015625, 3.211669921875, 3.34423828125, 3.476806640625, 3.609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 18.0, 28.0, 42.0, 71.0, 62.0, 124.0, 222.0, 338.0, 617.0, 948.0, 615.0, 363.0, 221.0, 129.0, 76.0, 53.0, 31.0, 36.0, 13.0, 18.0, 11.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.941162109375, -3.81201171875, -3.682861328125, -3.5537109375, -3.424560546875, -3.29541015625, -3.166259765625, -3.037109375, -2.907958984375, -2.77880859375, -2.649658203125, -2.5205078125, -2.391357421875, -2.26220703125, -2.133056640625, -2.00390625, -1.874755859375, -1.74560546875, -1.616455078125, -1.4873046875, -1.358154296875, -1.22900390625, -1.099853515625, -0.970703125, -0.841552734375, -0.71240234375, -0.583251953125, -0.4541015625, -0.324951171875, -0.19580078125, -0.066650390625, 0.0625, 0.191650390625, 0.32080078125, 0.449951171875, 0.5791015625, 0.708251953125, 0.83740234375, 0.966552734375, 1.095703125, 1.224853515625, 1.35400390625, 1.483154296875, 1.6123046875, 1.741455078125, 1.87060546875, 1.999755859375, 2.12890625, 2.258056640625, 2.38720703125, 2.516357421875, 2.6455078125, 2.774658203125, 2.90380859375, 3.032958984375, 3.162109375, 3.291259765625, 3.42041015625, 3.549560546875, 3.6787109375, 3.807861328125, 3.93701171875, 4.066162109375, 4.1953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 8.0, 3.0, 8.0, 17.0, 24.0, 31.0, 34.0, 35.0, 34.0, 48.0, 52.0, 64.0, 56.0, 70.0, 76.0, 59.0, 55.0, 48.0, 41.0, 37.0, 38.0, 32.0, 20.0, 18.0, 13.0, 11.0, 17.0, 8.0, 10.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.299647331237793, -10.990974426269531, -10.682300567626953, -10.373627662658691, -10.06495475769043, -9.756280899047852, -9.44760799407959, -9.138935089111328, -8.83026123046875, -8.521588325500488, -8.21291446685791, -7.904241561889648, -7.5955681800842285, -7.286894798278809, -6.978221893310547, -6.669548511505127, -6.360875606536865, -6.052202224731445, -5.743529319763184, -5.434855937957764, -5.126182556152344, -4.817509651184082, -4.508836269378662, -4.200162887573242, -3.8914897441864014, -3.5828166007995605, -3.2741432189941406, -2.9654700756073, -2.656796932220459, -2.348123550415039, -2.0394504070281982, -1.7307770252227783, -1.4221038818359375, -1.1134306192398071, -0.8047574162483215, -0.49608421325683594, -0.18741095066070557, 0.1212623119354248, 0.4299354553222656, 0.7386088371276855, 1.0472819805145264, 1.3559552431106567, 1.664628505706787, 1.973301649093628, 2.2819747924804688, 2.5906481742858887, 2.8993213176727295, 3.2079946994781494, 3.5166678428649902, 3.825340986251831, 4.134014129638672, 4.442687511444092, 4.751360893249512, 5.060033798217773, 5.368707180023193, 5.677380561828613, 5.986053466796875, 6.294726848602295, 6.603399753570557, 6.912073135375977, 7.2207465171813965, 7.529419898986816, 7.838092803955078, 8.146766662597656, 8.455439567565918]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 4.0, 14.0, 11.0, 16.0, 19.0, 18.0, 15.0, 17.0, 20.0, 19.0, 21.0, 23.0, 32.0, 37.0, 27.0, 24.0, 27.0, 36.0, 35.0, 36.0, 32.0, 26.0, 28.0, 32.0, 38.0, 35.0, 36.0, 23.0, 23.0, 24.0, 30.0, 30.0, 11.0, 21.0, 25.0, 18.0, 11.0, 22.0, 14.0, 6.0, 6.0, 7.0, 5.0, 9.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.652467727661133, -7.411046504974365, -7.1696248054504395, -6.928203582763672, -6.686781883239746, -6.4453606605529785, -6.203939437866211, -5.962517738342285, -5.721096038818359, -5.479674816131592, -5.238253116607666, -4.996831893920898, -4.755410194396973, -4.513988971710205, -4.2725677490234375, -4.031146049499512, -3.789724826812744, -3.5483033657073975, -3.306881904602051, -3.065460681915283, -2.8240389823913574, -2.58261775970459, -2.341196298599243, -2.0997748374938965, -1.8583533763885498, -1.6169319152832031, -1.3755104541778564, -1.1340891122817993, -0.8926676511764526, -0.651246190071106, -0.40982484817504883, -0.16840338706970215, 0.07301759719848633, 0.3144390285015106, 0.5558604598045349, 0.7972818613052368, 1.0387033224105835, 1.2801247835159302, 1.5215461254119873, 1.762967586517334, 2.0043890476226807, 2.2458105087280273, 2.487231969833374, 2.7286534309387207, 2.9700746536254883, 3.211496353149414, 3.4529175758361816, 3.6943390369415283, 3.935760498046875, 4.177181720733643, 4.418603420257568, 4.660024642944336, 4.901446342468262, 5.142867565155029, 5.384288787841797, 5.625710487365723, 5.867132186889648, 6.108553409576416, 6.349975109100342, 6.591396331787109, 6.832818031311035, 7.074239253997803, 7.31566047668457, 7.557082176208496, 7.798503398895264]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 21.0, 23.0, 37.0, 59.0, 113.0, 137.0, 244.0, 416.0, 646.0, 1159.0, 2089.0, 3633.0, 6429.0, 11315.0, 20205.0, 38265.0, 80960.0, 201620.0, 349725.0, 179725.0, 72945.0, 35818.0, 18762.0, 10522.0, 5836.0, 3357.0, 1852.0, 1032.0, 623.0, 330.0, 251.0, 150.0, 70.0, 67.0, 42.0, 16.0, 17.0, 14.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.396209716796875, -2.31195068359375, -2.227691650390625, -2.1434326171875, -2.059173583984375, -1.97491455078125, -1.890655517578125, -1.806396484375, -1.722137451171875, -1.63787841796875, -1.553619384765625, -1.4693603515625, -1.385101318359375, -1.30084228515625, -1.216583251953125, -1.13232421875, -1.048065185546875, -0.96380615234375, -0.879547119140625, -0.7952880859375, -0.711029052734375, -0.62677001953125, -0.542510986328125, -0.458251953125, -0.373992919921875, -0.28973388671875, -0.205474853515625, -0.1212158203125, -0.036956787109375, 0.04730224609375, 0.131561279296875, 0.2158203125, 0.300079345703125, 0.38433837890625, 0.468597412109375, 0.5528564453125, 0.637115478515625, 0.72137451171875, 0.805633544921875, 0.889892578125, 0.974151611328125, 1.05841064453125, 1.142669677734375, 1.2269287109375, 1.311187744140625, 1.39544677734375, 1.479705810546875, 1.56396484375, 1.648223876953125, 1.73248291015625, 1.816741943359375, 1.9010009765625, 1.985260009765625, 2.06951904296875, 2.153778076171875, 2.238037109375, 2.322296142578125, 2.40655517578125, 2.490814208984375, 2.5750732421875, 2.659332275390625, 2.74359130859375, 2.827850341796875, 2.912109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 9.0, 22.0, 9.0, 21.0, 21.0, 15.0, 25.0, 35.0, 25.0, 41.0, 44.0, 42.0, 48.0, 40.0, 52.0, 51.0, 36.0, 53.0, 40.0, 44.0, 34.0, 37.0, 30.0, 28.0, 30.0, 23.0, 19.0, 16.0, 10.0, 13.0, 15.0, 10.0, 12.0, 4.0, 11.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.33984375, -1.29876708984375, -1.2576904296875, -1.21661376953125, -1.175537109375, -1.13446044921875, -1.0933837890625, -1.05230712890625, -1.01123046875, -0.97015380859375, -0.9290771484375, -0.88800048828125, -0.846923828125, -0.80584716796875, -0.7647705078125, -0.72369384765625, -0.6826171875, -0.64154052734375, -0.6004638671875, -0.55938720703125, -0.518310546875, -0.47723388671875, -0.4361572265625, -0.39508056640625, -0.35400390625, -0.31292724609375, -0.2718505859375, -0.23077392578125, -0.189697265625, -0.14862060546875, -0.1075439453125, -0.06646728515625, -0.025390625, 0.01568603515625, 0.0567626953125, 0.09783935546875, 0.138916015625, 0.17999267578125, 0.2210693359375, 0.26214599609375, 0.30322265625, 0.34429931640625, 0.3853759765625, 0.42645263671875, 0.467529296875, 0.50860595703125, 0.5496826171875, 0.59075927734375, 0.6318359375, 0.67291259765625, 0.7139892578125, 0.75506591796875, 0.796142578125, 0.83721923828125, 0.8782958984375, 0.91937255859375, 0.96044921875, 1.00152587890625, 1.0426025390625, 1.08367919921875, 1.124755859375, 1.16583251953125, 1.2069091796875, 1.24798583984375, 1.2890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 11.0, 18.0, 25.0, 41.0, 30.0, 63.0, 94.0, 212.0, 279.0, 520.0, 1003.0, 1968.0, 4332.0, 9609.0, 21189.0, 47134.0, 118697.0, 341130.0, 314858.0, 107360.0, 43594.0, 19502.0, 8996.0, 3913.0, 1854.0, 930.0, 486.0, 263.0, 154.0, 94.0, 60.0, 43.0, 20.0, 21.0, 12.0, 9.0, 10.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65625, -2.55389404296875, -2.4515380859375, -2.34918212890625, -2.246826171875, -2.14447021484375, -2.0421142578125, -1.93975830078125, -1.83740234375, -1.73504638671875, -1.6326904296875, -1.53033447265625, -1.427978515625, -1.32562255859375, -1.2232666015625, -1.12091064453125, -1.0185546875, -0.91619873046875, -0.8138427734375, -0.71148681640625, -0.609130859375, -0.50677490234375, -0.4044189453125, -0.30206298828125, -0.19970703125, -0.09735107421875, 0.0050048828125, 0.10736083984375, 0.209716796875, 0.31207275390625, 0.4144287109375, 0.51678466796875, 0.619140625, 0.72149658203125, 0.8238525390625, 0.92620849609375, 1.028564453125, 1.13092041015625, 1.2332763671875, 1.33563232421875, 1.43798828125, 1.54034423828125, 1.6427001953125, 1.74505615234375, 1.847412109375, 1.94976806640625, 2.0521240234375, 2.15447998046875, 2.2568359375, 2.35919189453125, 2.4615478515625, 2.56390380859375, 2.666259765625, 2.76861572265625, 2.8709716796875, 2.97332763671875, 3.07568359375, 3.17803955078125, 3.2803955078125, 3.38275146484375, 3.485107421875, 3.58746337890625, 3.6898193359375, 3.79217529296875, 3.89453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 3.0, 2.0, 3.0, 6.0, 6.0, 12.0, 9.0, 8.0, 23.0, 15.0, 27.0, 32.0, 20.0, 42.0, 27.0, 36.0, 38.0, 48.0, 47.0, 46.0, 50.0, 43.0, 34.0, 56.0, 37.0, 42.0, 34.0, 33.0, 30.0, 31.0, 30.0, 21.0, 18.0, 20.0, 15.0, 9.0, 14.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.796875, -4.65948486328125, -4.5220947265625, -4.38470458984375, -4.247314453125, -4.10992431640625, -3.9725341796875, -3.83514404296875, -3.69775390625, -3.56036376953125, -3.4229736328125, -3.28558349609375, -3.148193359375, -3.01080322265625, -2.8734130859375, -2.73602294921875, -2.5986328125, -2.46124267578125, -2.3238525390625, -2.18646240234375, -2.049072265625, -1.91168212890625, -1.7742919921875, -1.63690185546875, -1.49951171875, -1.36212158203125, -1.2247314453125, -1.08734130859375, -0.949951171875, -0.81256103515625, -0.6751708984375, -0.53778076171875, -0.400390625, -0.26300048828125, -0.1256103515625, 0.01177978515625, 0.149169921875, 0.28656005859375, 0.4239501953125, 0.56134033203125, 0.69873046875, 0.83612060546875, 0.9735107421875, 1.11090087890625, 1.248291015625, 1.38568115234375, 1.5230712890625, 1.66046142578125, 1.7978515625, 1.93524169921875, 2.0726318359375, 2.21002197265625, 2.347412109375, 2.48480224609375, 2.6221923828125, 2.75958251953125, 2.89697265625, 3.03436279296875, 3.1717529296875, 3.30914306640625, 3.446533203125, 3.58392333984375, 3.7213134765625, 3.85870361328125, 3.99609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 16.0, 20.0, 21.0, 30.0, 56.0, 84.0, 91.0, 143.0, 221.0, 319.0, 559.0, 862.0, 1380.0, 2557.0, 4452.0, 7872.0, 14475.0, 26820.0, 49869.0, 99085.0, 206745.0, 294640.0, 165591.0, 80999.0, 41387.0, 22151.0, 12145.0, 6575.0, 3749.0, 2108.0, 1264.0, 789.0, 473.0, 357.0, 205.0, 153.0, 88.0, 54.0, 40.0, 21.0, 24.0, 11.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.1083984375, -1.075164794921875, -1.04193115234375, -1.008697509765625, -0.9754638671875, -0.942230224609375, -0.90899658203125, -0.875762939453125, -0.842529296875, -0.809295654296875, -0.77606201171875, -0.742828369140625, -0.7095947265625, -0.676361083984375, -0.64312744140625, -0.609893798828125, -0.57666015625, -0.543426513671875, -0.51019287109375, -0.476959228515625, -0.4437255859375, -0.410491943359375, -0.37725830078125, -0.344024658203125, -0.310791015625, -0.277557373046875, -0.24432373046875, -0.211090087890625, -0.1778564453125, -0.144622802734375, -0.11138916015625, -0.078155517578125, -0.044921875, -0.011688232421875, 0.02154541015625, 0.054779052734375, 0.0880126953125, 0.121246337890625, 0.15447998046875, 0.187713623046875, 0.220947265625, 0.254180908203125, 0.28741455078125, 0.320648193359375, 0.3538818359375, 0.387115478515625, 0.42034912109375, 0.453582763671875, 0.48681640625, 0.520050048828125, 0.55328369140625, 0.586517333984375, 0.6197509765625, 0.652984619140625, 0.68621826171875, 0.719451904296875, 0.752685546875, 0.785919189453125, 0.81915283203125, 0.852386474609375, 0.8856201171875, 0.918853759765625, 0.95208740234375, 0.985321044921875, 1.0185546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 10.0, 11.0, 15.0, 16.0, 24.0, 31.0, 41.0, 47.0, 93.0, 125.0, 113.0, 127.0, 84.0, 53.0, 40.0, 31.0, 27.0, 16.0, 15.0, 12.0, 10.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003561973571777344, -0.0003445148468017578, -0.00033283233642578125, -0.0003211498260498047, -0.0003094673156738281, -0.00029778480529785156, -0.000286102294921875, -0.00027441978454589844, -0.0002627372741699219, -0.0002510547637939453, -0.00023937225341796875, -0.0002276897430419922, -0.00021600723266601562, -0.00020432472229003906, -0.0001926422119140625, -0.00018095970153808594, -0.00016927719116210938, -0.0001575946807861328, -0.00014591217041015625, -0.0001342296600341797, -0.00012254714965820312, -0.00011086463928222656, -9.918212890625e-05, -8.749961853027344e-05, -7.581710815429688e-05, -6.413459777832031e-05, -5.245208740234375e-05, -4.076957702636719e-05, -2.9087066650390625e-05, -1.7404556274414062e-05, -5.7220458984375e-06, 5.9604644775390625e-06, 1.7642974853515625e-05, 2.9325485229492188e-05, 4.100799560546875e-05, 5.269050598144531e-05, 6.437301635742188e-05, 7.605552673339844e-05, 8.7738037109375e-05, 9.942054748535156e-05, 0.00011110305786132812, 0.0001227855682373047, 0.00013446807861328125, 0.0001461505889892578, 0.00015783309936523438, 0.00016951560974121094, 0.0001811981201171875, 0.00019288063049316406, 0.00020456314086914062, 0.0002162456512451172, 0.00022792816162109375, 0.0002396106719970703, 0.0002512931823730469, 0.00026297569274902344, 0.000274658203125, 0.00028634071350097656, 0.0002980232238769531, 0.0003097057342529297, 0.00032138824462890625, 0.0003330707550048828, 0.0003447532653808594, 0.00035643577575683594, 0.0003681182861328125, 0.00037980079650878906, 0.0003914833068847656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 10.0, 14.0, 25.0, 20.0, 37.0, 51.0, 78.0, 140.0, 232.0, 489.0, 932.0, 1858.0, 4521.0, 10885.0, 27781.0, 74780.0, 208217.0, 393055.0, 205208.0, 73793.0, 27449.0, 10700.0, 4477.0, 1853.0, 884.0, 418.0, 227.0, 122.0, 97.0, 48.0, 41.0, 32.0, 17.0, 12.0, 12.0, 7.0, 6.0, 2.0, 3.0, 6.0, 4.0, 0.0, 3.0, 3.0], "bins": [-1.7333984375, -1.687164306640625, -1.64093017578125, -1.594696044921875, -1.5484619140625, -1.502227783203125, -1.45599365234375, -1.409759521484375, -1.363525390625, -1.317291259765625, -1.27105712890625, -1.224822998046875, -1.1785888671875, -1.132354736328125, -1.08612060546875, -1.039886474609375, -0.99365234375, -0.947418212890625, -0.90118408203125, -0.854949951171875, -0.8087158203125, -0.762481689453125, -0.71624755859375, -0.670013427734375, -0.623779296875, -0.577545166015625, -0.53131103515625, -0.485076904296875, -0.4388427734375, -0.392608642578125, -0.34637451171875, -0.300140380859375, -0.25390625, -0.207672119140625, -0.16143798828125, -0.115203857421875, -0.0689697265625, -0.022735595703125, 0.02349853515625, 0.069732666015625, 0.115966796875, 0.162200927734375, 0.20843505859375, 0.254669189453125, 0.3009033203125, 0.347137451171875, 0.39337158203125, 0.439605712890625, 0.48583984375, 0.532073974609375, 0.57830810546875, 0.624542236328125, 0.6707763671875, 0.717010498046875, 0.76324462890625, 0.809478759765625, 0.855712890625, 0.901947021484375, 0.94818115234375, 0.994415283203125, 1.0406494140625, 1.086883544921875, 1.13311767578125, 1.179351806640625, 1.2255859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 0.0, 7.0, 5.0, 7.0, 4.0, 11.0, 21.0, 14.0, 20.0, 24.0, 30.0, 52.0, 69.0, 80.0, 105.0, 108.0, 100.0, 74.0, 60.0, 41.0, 39.0, 32.0, 18.0, 16.0, 13.0, 13.0, 10.0, 1.0, 4.0, 9.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8126068115234375, -1.762908935546875, -1.7132110595703125, -1.66351318359375, -1.6138153076171875, -1.564117431640625, -1.5144195556640625, -1.4647216796875, -1.4150238037109375, -1.365325927734375, -1.3156280517578125, -1.26593017578125, -1.2162322998046875, -1.166534423828125, -1.1168365478515625, -1.067138671875, -1.0174407958984375, -0.967742919921875, -0.9180450439453125, -0.86834716796875, -0.8186492919921875, -0.768951416015625, -0.7192535400390625, -0.6695556640625, -0.6198577880859375, -0.570159912109375, -0.5204620361328125, -0.47076416015625, -0.4210662841796875, -0.371368408203125, -0.3216705322265625, -0.27197265625, -0.2222747802734375, -0.172576904296875, -0.1228790283203125, -0.07318115234375, -0.0234832763671875, 0.026214599609375, 0.0759124755859375, 0.1256103515625, 0.1753082275390625, 0.225006103515625, 0.2747039794921875, 0.32440185546875, 0.3740997314453125, 0.423797607421875, 0.4734954833984375, 0.523193359375, 0.5728912353515625, 0.622589111328125, 0.6722869873046875, 0.72198486328125, 0.7716827392578125, 0.821380615234375, 0.8710784912109375, 0.9207763671875, 0.9704742431640625, 1.020172119140625, 1.0698699951171875, 1.11956787109375, 1.1692657470703125, 1.218963623046875, 1.2686614990234375, 1.318359375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 14.0, 4.0, 24.0, 37.0, 55.0, 69.0, 94.0, 100.0, 116.0, 104.0, 102.0, 89.0, 64.0, 48.0, 35.0, 21.0, 14.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.319637298583984, -21.731767654418945, -21.143896102905273, -20.556026458740234, -19.968154907226562, -19.380285263061523, -18.792415618896484, -18.204544067382812, -17.616674423217773, -17.028804779052734, -16.440933227539062, -15.853063583374023, -15.265192985534668, -14.677322387695312, -14.089452743530273, -13.501582145690918, -12.913711547851562, -12.325840950012207, -11.737970352172852, -11.150100708007812, -10.562230110168457, -9.974359512329102, -9.386489868164062, -8.798619270324707, -8.210748672485352, -7.622878074645996, -7.035007953643799, -6.447137832641602, -5.859267234802246, -5.271396636962891, -4.683526515960693, -4.095656394958496, -3.507783889770508, -2.9199135303497314, -2.332043170928955, -1.7441728115081787, -1.1563024520874023, -0.568432092666626, 0.01943826675415039, 0.6073083877563477, 1.1951789855957031, 1.7830493450164795, 2.370919704437256, 2.9587900638580322, 3.5466604232788086, 4.134531021118164, 4.722401142120361, 5.310271263122559, 5.898141860961914, 6.4860124588012695, 7.073882579803467, 7.661752700805664, 8.24962329864502, 8.837493896484375, 9.425363540649414, 10.01323413848877, 10.601104736328125, 11.18897533416748, 11.776845932006836, 12.364715576171875, 12.95258617401123, 13.540456771850586, 14.128326416015625, 14.71619701385498, 15.304067611694336]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 2.0, 6.0, 11.0, 8.0, 11.0, 17.0, 13.0, 18.0, 20.0, 21.0, 18.0, 28.0, 35.0, 35.0, 33.0, 32.0, 41.0, 40.0, 40.0, 53.0, 44.0, 45.0, 42.0, 38.0, 41.0, 40.0, 32.0, 35.0, 22.0, 27.0, 22.0, 20.0, 22.0, 21.0, 13.0, 12.0, 10.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0], "bins": [-13.945759773254395, -13.527469635009766, -13.109179496765137, -12.690889358520508, -12.272599220275879, -11.85430908203125, -11.436019897460938, -11.017728805541992, -10.59943962097168, -10.18114948272705, -9.762859344482422, -9.344569206237793, -8.926279067993164, -8.507988929748535, -8.089698791503906, -7.6714091300964355, -7.253118515014648, -6.8348283767700195, -6.416538238525391, -5.998248100280762, -5.579957962036133, -5.161667823791504, -4.743378162384033, -4.325088024139404, -3.9067978858947754, -3.4885077476501465, -3.0702176094055176, -2.6519277095794678, -2.233637571334839, -1.81534743309021, -1.3970575332641602, -0.9787673950195312, -0.5604782104492188, -0.14218813180923462, 0.2761019468307495, 0.6943919658660889, 1.1126821041107178, 1.5309722423553467, 1.9492621421813965, 2.3675522804260254, 2.7858424186706543, 3.204132556915283, 3.622422695159912, 4.040712356567383, 4.459002494812012, 4.877292633056641, 5.2955827713012695, 5.713872909545898, 6.132163047790527, 6.550453186035156, 6.968743324279785, 7.387033462524414, 7.805323600769043, 8.223613739013672, 8.641902923583984, 9.06019401550293, 9.478483200073242, 9.896773338317871, 10.3150634765625, 10.733353614807129, 11.151643753051758, 11.569933891296387, 11.988224029541016, 12.406513214111328, 12.824804306030273]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 21.0, 21.0, 40.0, 45.0, 73.0, 107.0, 167.0, 240.0, 377.0, 592.0, 865.0, 1477.0, 2240.0, 3820.0, 6502.0, 11812.0, 22672.0, 45071.0, 96032.0, 229414.0, 697434.0, 1902582.0, 738526.0, 238225.0, 99636.0, 45729.0, 22525.0, 11810.0, 6499.0, 3775.0, 2130.0, 1255.0, 840.0, 552.0, 355.0, 233.0, 176.0, 123.0, 84.0, 51.0, 38.0, 32.0, 20.0, 14.0, 8.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.654296875, -1.5982513427734375, -1.542205810546875, -1.4861602783203125, -1.43011474609375, -1.3740692138671875, -1.318023681640625, -1.2619781494140625, -1.2059326171875, -1.1498870849609375, -1.093841552734375, -1.0377960205078125, -0.98175048828125, -0.9257049560546875, -0.869659423828125, -0.8136138916015625, -0.757568359375, -0.7015228271484375, -0.645477294921875, -0.5894317626953125, -0.53338623046875, -0.4773406982421875, -0.421295166015625, -0.3652496337890625, -0.3092041015625, -0.2531585693359375, -0.197113037109375, -0.1410675048828125, -0.08502197265625, -0.0289764404296875, 0.027069091796875, 0.0831146240234375, 0.13916015625, 0.1952056884765625, 0.251251220703125, 0.3072967529296875, 0.36334228515625, 0.4193878173828125, 0.475433349609375, 0.5314788818359375, 0.5875244140625, 0.6435699462890625, 0.699615478515625, 0.7556610107421875, 0.81170654296875, 0.8677520751953125, 0.923797607421875, 0.9798431396484375, 1.035888671875, 1.0919342041015625, 1.147979736328125, 1.2040252685546875, 1.26007080078125, 1.3161163330078125, 1.372161865234375, 1.4282073974609375, 1.4842529296875, 1.5402984619140625, 1.596343994140625, 1.6523895263671875, 1.70843505859375, 1.7644805908203125, 1.820526123046875, 1.8765716552734375, 1.9326171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 15.0, 13.0, 4.0, 14.0, 14.0, 14.0, 22.0, 17.0, 30.0, 40.0, 40.0, 42.0, 44.0, 35.0, 53.0, 44.0, 38.0, 36.0, 48.0, 33.0, 33.0, 36.0, 42.0, 37.0, 41.0, 31.0, 25.0, 27.0, 19.0, 15.0, 12.0, 10.0, 9.0, 13.0, 6.0, 5.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.165924072265625, -1.12481689453125, -1.083709716796875, -1.0426025390625, -1.001495361328125, -0.96038818359375, -0.919281005859375, -0.878173828125, -0.837066650390625, -0.79595947265625, -0.754852294921875, -0.7137451171875, -0.672637939453125, -0.63153076171875, -0.590423583984375, -0.54931640625, -0.508209228515625, -0.46710205078125, -0.425994873046875, -0.3848876953125, -0.343780517578125, -0.30267333984375, -0.261566162109375, -0.220458984375, -0.179351806640625, -0.13824462890625, -0.097137451171875, -0.0560302734375, -0.014923095703125, 0.02618408203125, 0.067291259765625, 0.1083984375, 0.149505615234375, 0.19061279296875, 0.231719970703125, 0.2728271484375, 0.313934326171875, 0.35504150390625, 0.396148681640625, 0.437255859375, 0.478363037109375, 0.51947021484375, 0.560577392578125, 0.6016845703125, 0.642791748046875, 0.68389892578125, 0.725006103515625, 0.76611328125, 0.807220458984375, 0.84832763671875, 0.889434814453125, 0.9305419921875, 0.971649169921875, 1.01275634765625, 1.053863525390625, 1.094970703125, 1.136077880859375, 1.17718505859375, 1.218292236328125, 1.2593994140625, 1.300506591796875, 1.34161376953125, 1.382720947265625, 1.423828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 6.0, 8.0, 19.0, 22.0, 27.0, 44.0, 62.0, 71.0, 127.0, 204.0, 298.0, 669.0, 1437.0, 3881.0, 12730.0, 50799.0, 258966.0, 2273973.0, 1363857.0, 175472.0, 36454.0, 9480.0, 3150.0, 1174.0, 516.0, 307.0, 149.0, 107.0, 57.0, 53.0, 36.0, 31.0, 19.0, 7.0, 19.0, 15.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.53125, -4.3687744140625, -4.206298828125, -4.0438232421875, -3.88134765625, -3.7188720703125, -3.556396484375, -3.3939208984375, -3.2314453125, -3.0689697265625, -2.906494140625, -2.7440185546875, -2.58154296875, -2.4190673828125, -2.256591796875, -2.0941162109375, -1.931640625, -1.7691650390625, -1.606689453125, -1.4442138671875, -1.28173828125, -1.1192626953125, -0.956787109375, -0.7943115234375, -0.6318359375, -0.4693603515625, -0.306884765625, -0.1444091796875, 0.01806640625, 0.1805419921875, 0.343017578125, 0.5054931640625, 0.66796875, 0.8304443359375, 0.992919921875, 1.1553955078125, 1.31787109375, 1.4803466796875, 1.642822265625, 1.8052978515625, 1.9677734375, 2.1302490234375, 2.292724609375, 2.4552001953125, 2.61767578125, 2.7801513671875, 2.942626953125, 3.1051025390625, 3.267578125, 3.4300537109375, 3.592529296875, 3.7550048828125, 3.91748046875, 4.0799560546875, 4.242431640625, 4.4049072265625, 4.5673828125, 4.7298583984375, 4.892333984375, 5.0548095703125, 5.21728515625, 5.3797607421875, 5.542236328125, 5.7047119140625, 5.8671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 25.0, 38.0, 63.0, 95.0, 152.0, 282.0, 464.0, 982.0, 956.0, 461.0, 213.0, 127.0, 77.0, 50.0, 27.0, 13.0, 10.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.41796875, -7.24505615234375, -7.0721435546875, -6.89923095703125, -6.726318359375, -6.55340576171875, -6.3804931640625, -6.20758056640625, -6.03466796875, -5.86175537109375, -5.6888427734375, -5.51593017578125, -5.343017578125, -5.17010498046875, -4.9971923828125, -4.82427978515625, -4.6513671875, -4.47845458984375, -4.3055419921875, -4.13262939453125, -3.959716796875, -3.78680419921875, -3.6138916015625, -3.44097900390625, -3.26806640625, -3.09515380859375, -2.9222412109375, -2.74932861328125, -2.576416015625, -2.40350341796875, -2.2305908203125, -2.05767822265625, -1.884765625, -1.71185302734375, -1.5389404296875, -1.36602783203125, -1.193115234375, -1.02020263671875, -0.8472900390625, -0.67437744140625, -0.50146484375, -0.32855224609375, -0.1556396484375, 0.01727294921875, 0.190185546875, 0.36309814453125, 0.5360107421875, 0.70892333984375, 0.8818359375, 1.05474853515625, 1.2276611328125, 1.40057373046875, 1.573486328125, 1.74639892578125, 1.9193115234375, 2.09222412109375, 2.26513671875, 2.43804931640625, 2.6109619140625, 2.78387451171875, 2.956787109375, 3.12969970703125, 3.3026123046875, 3.47552490234375, 3.6484375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 17.0, 32.0, 59.0, 109.0, 125.0, 126.0, 148.0, 132.0, 96.0, 69.0, 35.0, 24.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.11302185058594, -36.29410934448242, -35.475196838378906, -34.65628433227539, -33.837371826171875, -33.01845932006836, -32.199546813964844, -31.380632400512695, -30.56171989440918, -29.742807388305664, -28.92389488220215, -28.104982376098633, -27.286067962646484, -26.46715545654297, -25.648242950439453, -24.829330444335938, -24.010417938232422, -23.191505432128906, -22.37259292602539, -21.553680419921875, -20.73476791381836, -19.915855407714844, -19.096940994262695, -18.27802848815918, -17.459115982055664, -16.64020347595215, -15.821290969848633, -15.0023775100708, -14.183465003967285, -13.36455249786377, -12.545639038085938, -11.726726531982422, -10.907815933227539, -10.088903427124023, -9.269990921020508, -8.451077461242676, -7.63216495513916, -6.8132524490356445, -5.994339466094971, -5.175426483154297, -4.356513977050781, -3.5376012325286865, -2.718688488006592, -1.899775743484497, -1.0808629989624023, -0.2619504928588867, 0.5569624900817871, 1.375875473022461, 2.1947879791259766, 3.0137007236480713, 3.832613468170166, 4.65152645111084, 5.4704389572143555, 6.289351463317871, 7.108264446258545, 7.927177429199219, 8.746089935302734, 9.56500244140625, 10.383914947509766, 11.202828407287598, 12.021740913391113, 12.840653419494629, 13.659566879272461, 14.478479385375977, 15.297391891479492]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 8.0, 9.0, 15.0, 5.0, 16.0, 18.0, 25.0, 22.0, 21.0, 21.0, 35.0, 37.0, 37.0, 36.0, 37.0, 36.0, 35.0, 37.0, 41.0, 38.0, 39.0, 39.0, 37.0, 30.0, 32.0, 37.0, 37.0, 27.0, 24.0, 19.0, 19.0, 19.0, 15.0, 21.0, 13.0, 9.0, 3.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.630386352539062, -10.316021919250488, -10.001657485961914, -9.68729305267334, -9.372928619384766, -9.058563232421875, -8.7441987991333, -8.429834365844727, -8.115469932556152, -7.801105499267578, -7.486741065979004, -7.1723761558532715, -6.858011722564697, -6.543647289276123, -6.229282379150391, -5.914917945861816, -5.600553512573242, -5.286189079284668, -4.971824645996094, -4.657459735870361, -4.343095302581787, -4.028730869293213, -3.7143661975860596, -3.4000015258789062, -3.085637092590332, -2.771272659301758, -2.4569079875946045, -2.142543315887451, -1.828178882598877, -1.5138143301010132, -1.1994497776031494, -0.8850851058959961, -0.5707206726074219, -0.2563561201095581, 0.058008432388305664, 0.37237298488616943, 0.6867375373840332, 1.001102089881897, 1.3154666423797607, 1.629831314086914, 1.9441957473754883, 2.2585601806640625, 2.572924852371216, 2.887289524078369, 3.2016539573669434, 3.5160183906555176, 3.830383062362671, 4.144747734069824, 4.459112167358398, 4.773476600646973, 5.087841033935547, 5.402205944061279, 5.7165703773498535, 6.030934810638428, 6.34529972076416, 6.659664154052734, 6.974028587341309, 7.288393020629883, 7.602757453918457, 7.9171223640441895, 8.231487274169922, 8.545851707458496, 8.86021614074707, 9.174580574035645, 9.488945007324219]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 5.0, 14.0, 25.0, 42.0, 55.0, 70.0, 109.0, 140.0, 225.0, 320.0, 489.0, 706.0, 1003.0, 1563.0, 2218.0, 3604.0, 5607.0, 9284.0, 15591.0, 27698.0, 58694.0, 163377.0, 388257.0, 217629.0, 72672.0, 33058.0, 17838.0, 10229.0, 6216.0, 3931.0, 2626.0, 1731.0, 1095.0, 785.0, 510.0, 336.0, 235.0, 192.0, 111.0, 69.0, 48.0, 38.0, 37.0, 15.0, 12.0, 16.0, 7.0, 4.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-2.53125, -2.455963134765625, -2.38067626953125, -2.305389404296875, -2.2301025390625, -2.154815673828125, -2.07952880859375, -2.004241943359375, -1.928955078125, -1.853668212890625, -1.77838134765625, -1.703094482421875, -1.6278076171875, -1.552520751953125, -1.47723388671875, -1.401947021484375, -1.32666015625, -1.251373291015625, -1.17608642578125, -1.100799560546875, -1.0255126953125, -0.950225830078125, -0.87493896484375, -0.799652099609375, -0.724365234375, -0.649078369140625, -0.57379150390625, -0.498504638671875, -0.4232177734375, -0.347930908203125, -0.27264404296875, -0.197357177734375, -0.1220703125, -0.046783447265625, 0.02850341796875, 0.103790283203125, 0.1790771484375, 0.254364013671875, 0.32965087890625, 0.404937744140625, 0.480224609375, 0.555511474609375, 0.63079833984375, 0.706085205078125, 0.7813720703125, 0.856658935546875, 0.93194580078125, 1.007232666015625, 1.08251953125, 1.157806396484375, 1.23309326171875, 1.308380126953125, 1.3836669921875, 1.458953857421875, 1.53424072265625, 1.609527587890625, 1.684814453125, 1.760101318359375, 1.83538818359375, 1.910675048828125, 1.9859619140625, 2.061248779296875, 2.13653564453125, 2.211822509765625, 2.287109375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 3.0, 10.0, 11.0, 20.0, 25.0, 26.0, 32.0, 30.0, 23.0, 31.0, 34.0, 48.0, 46.0, 50.0, 59.0, 54.0, 47.0, 54.0, 32.0, 41.0, 35.0, 40.0, 27.0, 36.0, 27.0, 28.0, 21.0, 22.0, 19.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8154296875, -1.76361083984375, -1.7117919921875, -1.65997314453125, -1.608154296875, -1.55633544921875, -1.5045166015625, -1.45269775390625, -1.40087890625, -1.34906005859375, -1.2972412109375, -1.24542236328125, -1.193603515625, -1.14178466796875, -1.0899658203125, -1.03814697265625, -0.986328125, -0.93450927734375, -0.8826904296875, -0.83087158203125, -0.779052734375, -0.72723388671875, -0.6754150390625, -0.62359619140625, -0.57177734375, -0.51995849609375, -0.4681396484375, -0.41632080078125, -0.364501953125, -0.31268310546875, -0.2608642578125, -0.20904541015625, -0.1572265625, -0.10540771484375, -0.0535888671875, -0.00177001953125, 0.050048828125, 0.10186767578125, 0.1536865234375, 0.20550537109375, 0.25732421875, 0.30914306640625, 0.3609619140625, 0.41278076171875, 0.464599609375, 0.51641845703125, 0.5682373046875, 0.62005615234375, 0.671875, 0.72369384765625, 0.7755126953125, 0.82733154296875, 0.879150390625, 0.93096923828125, 0.9827880859375, 1.03460693359375, 1.08642578125, 1.13824462890625, 1.1900634765625, 1.24188232421875, 1.293701171875, 1.34552001953125, 1.3973388671875, 1.44915771484375, 1.5009765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 11.0, 14.0, 16.0, 29.0, 51.0, 86.0, 145.0, 223.0, 439.0, 772.0, 1601.0, 3294.0, 7017.0, 14795.0, 35566.0, 116166.0, 474850.0, 284086.0, 64735.0, 23978.0, 10599.0, 4971.0, 2451.0, 1259.0, 592.0, 313.0, 164.0, 109.0, 66.0, 34.0, 38.0, 17.0, 19.0, 10.0, 7.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.689453125, -3.576904296875, -3.46435546875, -3.351806640625, -3.2392578125, -3.126708984375, -3.01416015625, -2.901611328125, -2.7890625, -2.676513671875, -2.56396484375, -2.451416015625, -2.3388671875, -2.226318359375, -2.11376953125, -2.001220703125, -1.888671875, -1.776123046875, -1.66357421875, -1.551025390625, -1.4384765625, -1.325927734375, -1.21337890625, -1.100830078125, -0.98828125, -0.875732421875, -0.76318359375, -0.650634765625, -0.5380859375, -0.425537109375, -0.31298828125, -0.200439453125, -0.087890625, 0.024658203125, 0.13720703125, 0.249755859375, 0.3623046875, 0.474853515625, 0.58740234375, 0.699951171875, 0.8125, 0.925048828125, 1.03759765625, 1.150146484375, 1.2626953125, 1.375244140625, 1.48779296875, 1.600341796875, 1.712890625, 1.825439453125, 1.93798828125, 2.050537109375, 2.1630859375, 2.275634765625, 2.38818359375, 2.500732421875, 2.61328125, 2.725830078125, 2.83837890625, 2.950927734375, 3.0634765625, 3.176025390625, 3.28857421875, 3.401123046875, 3.513671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 8.0, 9.0, 10.0, 6.0, 21.0, 19.0, 15.0, 18.0, 24.0, 17.0, 21.0, 26.0, 28.0, 29.0, 30.0, 30.0, 37.0, 30.0, 28.0, 48.0, 38.0, 28.0, 34.0, 37.0, 37.0, 26.0, 35.0, 31.0, 21.0, 27.0, 22.0, 21.0, 22.0, 21.0, 18.0, 16.0, 15.0, 12.0, 10.0, 5.0, 12.0, 13.0, 6.0, 2.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.453125, -3.3436279296875, -3.234130859375, -3.1246337890625, -3.01513671875, -2.9056396484375, -2.796142578125, -2.6866455078125, -2.5771484375, -2.4676513671875, -2.358154296875, -2.2486572265625, -2.13916015625, -2.0296630859375, -1.920166015625, -1.8106689453125, -1.701171875, -1.5916748046875, -1.482177734375, -1.3726806640625, -1.26318359375, -1.1536865234375, -1.044189453125, -0.9346923828125, -0.8251953125, -0.7156982421875, -0.606201171875, -0.4967041015625, -0.38720703125, -0.2777099609375, -0.168212890625, -0.0587158203125, 0.05078125, 0.1602783203125, 0.269775390625, 0.3792724609375, 0.48876953125, 0.5982666015625, 0.707763671875, 0.8172607421875, 0.9267578125, 1.0362548828125, 1.145751953125, 1.2552490234375, 1.36474609375, 1.4742431640625, 1.583740234375, 1.6932373046875, 1.802734375, 1.9122314453125, 2.021728515625, 2.1312255859375, 2.24072265625, 2.3502197265625, 2.459716796875, 2.5692138671875, 2.6787109375, 2.7882080078125, 2.897705078125, 3.0072021484375, 3.11669921875, 3.2261962890625, 3.335693359375, 3.4451904296875, 3.5546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 11.0, 16.0, 28.0, 40.0, 41.0, 86.0, 110.0, 189.0, 281.0, 482.0, 827.0, 1443.0, 2489.0, 4670.0, 8501.0, 15734.0, 30276.0, 59858.0, 129268.0, 311052.0, 267872.0, 107535.0, 51339.0, 25900.0, 13679.0, 7398.0, 4001.0, 2266.0, 1269.0, 741.0, 399.0, 274.0, 151.0, 110.0, 81.0, 40.0, 27.0, 23.0, 8.0, 12.0, 7.0, 5.0, 3.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9676971435546875, -0.936370849609375, -0.9050445556640625, -0.87371826171875, -0.8423919677734375, -0.811065673828125, -0.7797393798828125, -0.7484130859375, -0.7170867919921875, -0.685760498046875, -0.6544342041015625, -0.62310791015625, -0.5917816162109375, -0.560455322265625, -0.5291290283203125, -0.497802734375, -0.4664764404296875, -0.435150146484375, -0.4038238525390625, -0.37249755859375, -0.3411712646484375, -0.309844970703125, -0.2785186767578125, -0.2471923828125, -0.2158660888671875, -0.184539794921875, -0.1532135009765625, -0.12188720703125, -0.0905609130859375, -0.059234619140625, -0.0279083251953125, 0.00341796875, 0.0347442626953125, 0.066070556640625, 0.0973968505859375, 0.12872314453125, 0.1600494384765625, 0.191375732421875, 0.2227020263671875, 0.2540283203125, 0.2853546142578125, 0.316680908203125, 0.3480072021484375, 0.37933349609375, 0.4106597900390625, 0.441986083984375, 0.4733123779296875, 0.504638671875, 0.5359649658203125, 0.567291259765625, 0.5986175537109375, 0.62994384765625, 0.6612701416015625, 0.692596435546875, 0.7239227294921875, 0.7552490234375, 0.7865753173828125, 0.817901611328125, 0.8492279052734375, 0.88055419921875, 0.9118804931640625, 0.943206787109375, 0.9745330810546875, 1.005859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 10.0, 8.0, 13.0, 23.0, 18.0, 33.0, 43.0, 87.0, 135.0, 181.0, 149.0, 82.0, 54.0, 41.0, 23.0, 19.0, 14.0, 14.0, 16.0, 5.0, 5.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003495216369628906, -0.000337306410074234, -0.0003250911831855774, -0.0003128759562969208, -0.00030066072940826416, -0.00028844550251960754, -0.00027623027563095093, -0.0002640150487422943, -0.0002517998218536377, -0.00023958459496498108, -0.00022736936807632446, -0.00021515414118766785, -0.00020293891429901123, -0.00019072368741035461, -0.000178508460521698, -0.00016629323363304138, -0.00015407800674438477, -0.00014186277985572815, -0.00012964755296707153, -0.00011743232607841492, -0.0001052170991897583, -9.300187230110168e-05, -8.078664541244507e-05, -6.857141852378845e-05, -5.6356191635131836e-05, -4.414096474647522e-05, -3.1925737857818604e-05, -1.9710510969161987e-05, -7.495284080505371e-06, 4.719942808151245e-06, 1.693516969680786e-05, 2.9150396585464478e-05, 4.1365623474121094e-05, 5.358085036277771e-05, 6.579607725143433e-05, 7.801130414009094e-05, 9.022653102874756e-05, 0.00010244175791740417, 0.00011465698480606079, 0.0001268722116947174, 0.00013908743858337402, 0.00015130266547203064, 0.00016351789236068726, 0.00017573311924934387, 0.0001879483461380005, 0.0002001635730266571, 0.00021237879991531372, 0.00022459402680397034, 0.00023680925369262695, 0.00024902448058128357, 0.0002612397074699402, 0.0002734549343585968, 0.0002856701612472534, 0.00029788538813591003, 0.00031010061502456665, 0.00032231584191322327, 0.0003345310688018799, 0.0003467462956905365, 0.0003589615225791931, 0.00037117674946784973, 0.00038339197635650635, 0.00039560720324516296, 0.0004078224301338196, 0.0004200376570224762, 0.0004322528839111328]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 14.0, 12.0, 22.0, 37.0, 64.0, 90.0, 134.0, 247.0, 491.0, 1061.0, 2634.0, 6564.0, 18900.0, 58192.0, 208554.0, 489618.0, 182510.0, 51788.0, 17003.0, 6077.0, 2389.0, 1046.0, 433.0, 276.0, 146.0, 80.0, 57.0, 32.0, 20.0, 16.0, 9.0, 8.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4443359375, -1.3917236328125, -1.339111328125, -1.2864990234375, -1.23388671875, -1.1812744140625, -1.128662109375, -1.0760498046875, -1.0234375, -0.9708251953125, -0.918212890625, -0.8656005859375, -0.81298828125, -0.7603759765625, -0.707763671875, -0.6551513671875, -0.6025390625, -0.5499267578125, -0.497314453125, -0.4447021484375, -0.39208984375, -0.3394775390625, -0.286865234375, -0.2342529296875, -0.181640625, -0.1290283203125, -0.076416015625, -0.0238037109375, 0.02880859375, 0.0814208984375, 0.134033203125, 0.1866455078125, 0.2392578125, 0.2918701171875, 0.344482421875, 0.3970947265625, 0.44970703125, 0.5023193359375, 0.554931640625, 0.6075439453125, 0.66015625, 0.7127685546875, 0.765380859375, 0.8179931640625, 0.87060546875, 0.9232177734375, 0.975830078125, 1.0284423828125, 1.0810546875, 1.1336669921875, 1.186279296875, 1.2388916015625, 1.29150390625, 1.3441162109375, 1.396728515625, 1.4493408203125, 1.501953125, 1.5545654296875, 1.607177734375, 1.6597900390625, 1.71240234375, 1.7650146484375, 1.817626953125, 1.8702392578125, 1.9228515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 22.0, 25.0, 23.0, 30.0, 29.0, 37.0, 37.0, 47.0, 63.0, 89.0, 73.0, 77.0, 58.0, 61.0, 48.0, 44.0, 29.0, 25.0, 26.0, 26.0, 20.0, 15.0, 7.0, 5.0, 1.0, 7.0, 6.0, 7.0, 5.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9287109375, -0.8962249755859375, -0.863739013671875, -0.8312530517578125, -0.79876708984375, -0.7662811279296875, -0.733795166015625, -0.7013092041015625, -0.6688232421875, -0.6363372802734375, -0.603851318359375, -0.5713653564453125, -0.53887939453125, -0.5063934326171875, -0.473907470703125, -0.4414215087890625, -0.408935546875, -0.3764495849609375, -0.343963623046875, -0.3114776611328125, -0.27899169921875, -0.2465057373046875, -0.214019775390625, -0.1815338134765625, -0.1490478515625, -0.1165618896484375, -0.084075927734375, -0.0515899658203125, -0.01910400390625, 0.0133819580078125, 0.045867919921875, 0.0783538818359375, 0.11083984375, 0.1433258056640625, 0.175811767578125, 0.2082977294921875, 0.24078369140625, 0.2732696533203125, 0.305755615234375, 0.3382415771484375, 0.3707275390625, 0.4032135009765625, 0.435699462890625, 0.4681854248046875, 0.50067138671875, 0.5331573486328125, 0.565643310546875, 0.5981292724609375, 0.630615234375, 0.6631011962890625, 0.695587158203125, 0.7280731201171875, 0.76055908203125, 0.7930450439453125, 0.825531005859375, 0.8580169677734375, 0.8905029296875, 0.9229888916015625, 0.955474853515625, 0.9879608154296875, 1.02044677734375, 1.0529327392578125, 1.085418701171875, 1.1179046630859375, 1.150390625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 21.0, 39.0, 60.0, 88.0, 129.0, 142.0, 152.0, 132.0, 89.0, 54.0, 32.0, 21.0, 22.0, 8.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.992462158203125, -9.36529541015625, -8.738128662109375, -8.1109619140625, -7.483795166015625, -6.85662841796875, -6.229461193084717, -5.602294445037842, -4.975127696990967, -4.347960948944092, -3.720794200897217, -3.0936272144317627, -2.4664604663848877, -1.8392937183380127, -1.2121267318725586, -0.5849599838256836, 0.042206764221191406, 0.6693735718727112, 1.296540379524231, 1.9237072467803955, 2.5508739948272705, 3.1780407428741455, 3.8052077293395996, 4.432374477386475, 5.05954122543335, 5.686707973480225, 6.3138747215271, 6.941041946411133, 7.568208694458008, 8.195375442504883, 8.822542190551758, 9.449708938598633, 10.076875686645508, 10.704042434692383, 11.331209182739258, 11.958375930786133, 12.585542678833008, 13.212709426879883, 13.839876174926758, 14.467042922973633, 15.094209671020508, 15.721376419067383, 16.348543167114258, 16.975709915161133, 17.602876663208008, 18.230043411254883, 18.857210159301758, 19.484376907348633, 20.11154556274414, 20.738712310791016, 21.36587905883789, 21.993045806884766, 22.62021255493164, 23.247379302978516, 23.87454605102539, 24.501712799072266, 25.12887954711914, 25.756046295166016, 26.38321304321289, 27.010379791259766, 27.63754653930664, 28.264713287353516, 28.89188003540039, 29.519046783447266, 30.14621353149414]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 11.0, 6.0, 6.0, 13.0, 10.0, 11.0, 17.0, 14.0, 37.0, 23.0, 29.0, 35.0, 38.0, 32.0, 37.0, 26.0, 32.0, 37.0, 36.0, 30.0, 36.0, 32.0, 42.0, 43.0, 38.0, 39.0, 23.0, 31.0, 20.0, 16.0, 23.0, 14.0, 22.0, 17.0, 14.0, 14.0, 13.0, 17.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.290658950805664, -9.01656436920166, -8.742469787597656, -8.468375205993652, -8.194280624389648, -7.920185565948486, -7.646090507507324, -7.37199592590332, -7.097901344299316, -6.8238067626953125, -6.549712181091309, -6.2756171226501465, -6.001522541046143, -5.727427959442139, -5.453332901000977, -5.179238319396973, -4.905143737792969, -4.631049156188965, -4.356954574584961, -4.082859516143799, -3.808764934539795, -3.534670352935791, -3.260575532913208, -2.986480712890625, -2.712386131286621, -2.438291549682617, -2.164196729660034, -1.8901020288467407, -1.6160073280334473, -1.3419126272201538, -1.0678179264068604, -0.7937232255935669, -0.519627571105957, -0.24553287029266357, 0.028561830520629883, 0.30265653133392334, 0.5767512321472168, 0.8508459329605103, 1.1249406337738037, 1.3990353345870972, 1.6731300354003906, 1.947224736213684, 2.2213194370269775, 2.4954142570495605, 2.7695088386535645, 3.0436034202575684, 3.3176982402801514, 3.5917930603027344, 3.8658876419067383, 4.139982223510742, 4.414076805114746, 4.688171863555908, 4.962266445159912, 5.236361026763916, 5.510456085205078, 5.784550666809082, 6.058645248413086, 6.33273983001709, 6.606834411621094, 6.880929470062256, 7.15502405166626, 7.429118633270264, 7.703213691711426, 7.97730827331543, 8.251402854919434]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 20.0, 12.0, 23.0, 27.0, 36.0, 65.0, 74.0, 107.0, 195.0, 288.0, 396.0, 625.0, 1075.0, 1674.0, 2892.0, 5006.0, 8970.0, 17515.0, 35910.0, 80716.0, 211024.0, 781850.0, 2164238.0, 571941.0, 172689.0, 69915.0, 32015.0, 15818.0, 8089.0, 4486.0, 2553.0, 1472.0, 968.0, 532.0, 358.0, 214.0, 152.0, 102.0, 68.0, 47.0, 41.0, 19.0, 21.0, 9.0, 7.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.39453125, -2.322845458984375, -2.25115966796875, -2.179473876953125, -2.1077880859375, -2.036102294921875, -1.96441650390625, -1.892730712890625, -1.821044921875, -1.749359130859375, -1.67767333984375, -1.605987548828125, -1.5343017578125, -1.462615966796875, -1.39093017578125, -1.319244384765625, -1.24755859375, -1.175872802734375, -1.10418701171875, -1.032501220703125, -0.9608154296875, -0.889129638671875, -0.81744384765625, -0.745758056640625, -0.674072265625, -0.602386474609375, -0.53070068359375, -0.459014892578125, -0.3873291015625, -0.315643310546875, -0.24395751953125, -0.172271728515625, -0.1005859375, -0.028900146484375, 0.04278564453125, 0.114471435546875, 0.1861572265625, 0.257843017578125, 0.32952880859375, 0.401214599609375, 0.472900390625, 0.544586181640625, 0.61627197265625, 0.687957763671875, 0.7596435546875, 0.831329345703125, 0.90301513671875, 0.974700927734375, 1.04638671875, 1.118072509765625, 1.18975830078125, 1.261444091796875, 1.3331298828125, 1.404815673828125, 1.47650146484375, 1.548187255859375, 1.619873046875, 1.691558837890625, 1.76324462890625, 1.834930419921875, 1.9066162109375, 1.978302001953125, 2.04998779296875, 2.121673583984375, 2.193359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 6.0, 17.0, 9.0, 26.0, 17.0, 16.0, 27.0, 34.0, 28.0, 30.0, 40.0, 39.0, 38.0, 39.0, 30.0, 42.0, 49.0, 37.0, 53.0, 50.0, 40.0, 47.0, 35.0, 31.0, 30.0, 29.0, 24.0, 22.0, 13.0, 11.0, 13.0, 12.0, 21.0, 6.0, 6.0, 8.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3735809326171875, -1.327239990234375, -1.2808990478515625, -1.23455810546875, -1.1882171630859375, -1.141876220703125, -1.0955352783203125, -1.0491943359375, -1.0028533935546875, -0.956512451171875, -0.9101715087890625, -0.86383056640625, -0.8174896240234375, -0.771148681640625, -0.7248077392578125, -0.678466796875, -0.6321258544921875, -0.585784912109375, -0.5394439697265625, -0.49310302734375, -0.4467620849609375, -0.400421142578125, -0.3540802001953125, -0.3077392578125, -0.2613983154296875, -0.215057373046875, -0.1687164306640625, -0.12237548828125, -0.0760345458984375, -0.029693603515625, 0.0166473388671875, 0.06298828125, 0.1093292236328125, 0.155670166015625, 0.2020111083984375, 0.24835205078125, 0.2946929931640625, 0.341033935546875, 0.3873748779296875, 0.4337158203125, 0.4800567626953125, 0.526397705078125, 0.5727386474609375, 0.61907958984375, 0.6654205322265625, 0.711761474609375, 0.7581024169921875, 0.804443359375, 0.8507843017578125, 0.897125244140625, 0.9434661865234375, 0.98980712890625, 1.0361480712890625, 1.082489013671875, 1.1288299560546875, 1.1751708984375, 1.2215118408203125, 1.267852783203125, 1.3141937255859375, 1.36053466796875, 1.4068756103515625, 1.453216552734375, 1.4995574951171875, 1.5458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 5.0, 13.0, 8.0, 22.0, 37.0, 41.0, 79.0, 110.0, 174.0, 298.0, 513.0, 845.0, 1588.0, 2792.0, 5538.0, 11355.0, 24782.0, 57065.0, 142546.0, 421188.0, 1901029.0, 1156570.0, 283404.0, 103607.0, 42400.0, 19189.0, 8994.0, 4551.0, 2320.0, 1234.0, 762.0, 440.0, 274.0, 182.0, 107.0, 75.0, 51.0, 34.0, 18.0, 15.0, 12.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.193359375, -3.096099853515625, -2.99884033203125, -2.901580810546875, -2.8043212890625, -2.707061767578125, -2.60980224609375, -2.512542724609375, -2.415283203125, -2.318023681640625, -2.22076416015625, -2.123504638671875, -2.0262451171875, -1.928985595703125, -1.83172607421875, -1.734466552734375, -1.63720703125, -1.539947509765625, -1.44268798828125, -1.345428466796875, -1.2481689453125, -1.150909423828125, -1.05364990234375, -0.956390380859375, -0.859130859375, -0.761871337890625, -0.66461181640625, -0.567352294921875, -0.4700927734375, -0.372833251953125, -0.27557373046875, -0.178314208984375, -0.0810546875, 0.016204833984375, 0.11346435546875, 0.210723876953125, 0.3079833984375, 0.405242919921875, 0.50250244140625, 0.599761962890625, 0.697021484375, 0.794281005859375, 0.89154052734375, 0.988800048828125, 1.0860595703125, 1.183319091796875, 1.28057861328125, 1.377838134765625, 1.47509765625, 1.572357177734375, 1.66961669921875, 1.766876220703125, 1.8641357421875, 1.961395263671875, 2.05865478515625, 2.155914306640625, 2.253173828125, 2.350433349609375, 2.44769287109375, 2.544952392578125, 2.6422119140625, 2.739471435546875, 2.83673095703125, 2.933990478515625, 3.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 11.0, 16.0, 18.0, 20.0, 18.0, 26.0, 41.0, 45.0, 74.0, 114.0, 153.0, 222.0, 305.0, 516.0, 785.0, 576.0, 323.0, 227.0, 164.0, 107.0, 67.0, 68.0, 50.0, 35.0, 25.0, 16.0, 10.0, 9.0, 10.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.25, -3.136474609375, -3.02294921875, -2.909423828125, -2.7958984375, -2.682373046875, -2.56884765625, -2.455322265625, -2.341796875, -2.228271484375, -2.11474609375, -2.001220703125, -1.8876953125, -1.774169921875, -1.66064453125, -1.547119140625, -1.43359375, -1.320068359375, -1.20654296875, -1.093017578125, -0.9794921875, -0.865966796875, -0.75244140625, -0.638916015625, -0.525390625, -0.411865234375, -0.29833984375, -0.184814453125, -0.0712890625, 0.042236328125, 0.15576171875, 0.269287109375, 0.3828125, 0.496337890625, 0.60986328125, 0.723388671875, 0.8369140625, 0.950439453125, 1.06396484375, 1.177490234375, 1.291015625, 1.404541015625, 1.51806640625, 1.631591796875, 1.7451171875, 1.858642578125, 1.97216796875, 2.085693359375, 2.19921875, 2.312744140625, 2.42626953125, 2.539794921875, 2.6533203125, 2.766845703125, 2.88037109375, 2.993896484375, 3.107421875, 3.220947265625, 3.33447265625, 3.447998046875, 3.5615234375, 3.675048828125, 3.78857421875, 3.902099609375, 4.015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 14.0, 15.0, 38.0, 51.0, 86.0, 103.0, 129.0, 132.0, 110.0, 102.0, 78.0, 42.0, 39.0, 20.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-28.697418212890625, -28.034278869628906, -27.371139526367188, -26.70800018310547, -26.04486083984375, -25.3817195892334, -24.71858024597168, -24.05544090270996, -23.392301559448242, -22.729162216186523, -22.066022872924805, -21.402883529663086, -20.739742279052734, -20.076602935791016, -19.413463592529297, -18.750324249267578, -18.08718490600586, -17.42404556274414, -16.760906219482422, -16.097766876220703, -15.434626579284668, -14.77148723602295, -14.108346939086914, -13.445207595825195, -12.782068252563477, -12.118928909301758, -11.455789566040039, -10.792649269104004, -10.129509925842285, -9.466370582580566, -8.803230285644531, -8.140090942382812, -7.476951599121094, -6.813812255859375, -6.150672435760498, -5.487532615661621, -4.824393272399902, -4.161253929138184, -3.4981141090393066, -2.8349742889404297, -2.171834945678711, -1.508695363998413, -0.8455557823181152, -0.18241620063781738, 0.48072338104248047, 1.1438629627227783, 1.8070025444030762, 2.470142364501953, 3.133281707763672, 3.7964212894439697, 4.459560871124268, 5.1227006912231445, 5.785840034484863, 6.448979377746582, 7.112119197845459, 7.775259017944336, 8.438398361206055, 9.101537704467773, 9.764677047729492, 10.427817344665527, 11.090956687927246, 11.754096031188965, 12.417236328125, 13.080375671386719, 13.743515014648438]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 3.0, 6.0, 8.0, 12.0, 16.0, 19.0, 10.0, 17.0, 24.0, 25.0, 26.0, 28.0, 34.0, 38.0, 26.0, 20.0, 40.0, 32.0, 39.0, 49.0, 35.0, 43.0, 44.0, 33.0, 40.0, 41.0, 32.0, 28.0, 37.0, 21.0, 8.0, 24.0, 17.0, 22.0, 17.0, 13.0, 8.0, 12.0, 10.0, 8.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.769560813903809, -8.477986335754395, -8.18641185760498, -7.894836902618408, -7.603261947631836, -7.311687469482422, -7.020112991333008, -6.728538513183594, -6.4369635581970215, -6.145389080047607, -5.853814125061035, -5.562239646911621, -5.270665168762207, -4.979090213775635, -4.687515735626221, -4.395940780639648, -4.104366302490234, -3.812791585922241, -3.521216869354248, -3.229642391204834, -2.938067674636841, -2.6464929580688477, -2.3549184799194336, -2.0633437633514404, -1.7717690467834473, -1.480194330215454, -1.1886197328567505, -0.8970450758934021, -0.6054704189300537, -0.31389570236206055, -0.022321105003356934, 0.2692534923553467, 0.5608272552490234, 0.8524019122123718, 1.1439765691757202, 1.4355511665344238, 1.727125883102417, 2.01870059967041, 2.310275077819824, 2.6018497943878174, 2.8934245109558105, 3.1849992275238037, 3.476573944091797, 3.768148422241211, 4.059722900390625, 4.351297855377197, 4.642872333526611, 4.934447288513184, 5.226021766662598, 5.517596244812012, 5.809171199798584, 6.100745677947998, 6.39232063293457, 6.683895111083984, 6.975469589233398, 7.2670440673828125, 7.558619022369385, 7.850193500518799, 8.141768455505371, 8.433342933654785, 8.7249174118042, 9.01649284362793, 9.308067321777344, 9.599641799926758, 9.891216278076172]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 11.0, 16.0, 16.0, 42.0, 36.0, 84.0, 141.0, 202.0, 281.0, 395.0, 687.0, 937.0, 1458.0, 2122.0, 3332.0, 5097.0, 8104.0, 13892.0, 25153.0, 52236.0, 124719.0, 273903.0, 284112.0, 132206.0, 54988.0, 26464.0, 14158.0, 8351.0, 5306.0, 3368.0, 2231.0, 1475.0, 1019.0, 659.0, 437.0, 320.0, 194.0, 164.0, 76.0, 57.0, 37.0, 29.0, 17.0, 10.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.0853118896484375, -2.022186279296875, -1.9590606689453125, -1.89593505859375, -1.8328094482421875, -1.769683837890625, -1.7065582275390625, -1.6434326171875, -1.5803070068359375, -1.517181396484375, -1.4540557861328125, -1.39093017578125, -1.3278045654296875, -1.264678955078125, -1.2015533447265625, -1.138427734375, -1.0753021240234375, -1.012176513671875, -0.9490509033203125, -0.88592529296875, -0.8227996826171875, -0.759674072265625, -0.6965484619140625, -0.6334228515625, -0.5702972412109375, -0.507171630859375, -0.4440460205078125, -0.38092041015625, -0.3177947998046875, -0.254669189453125, -0.1915435791015625, -0.12841796875, -0.0652923583984375, -0.002166748046875, 0.0609588623046875, 0.12408447265625, 0.1872100830078125, 0.250335693359375, 0.3134613037109375, 0.3765869140625, 0.4397125244140625, 0.502838134765625, 0.5659637451171875, 0.62908935546875, 0.6922149658203125, 0.755340576171875, 0.8184661865234375, 0.881591796875, 0.9447174072265625, 1.007843017578125, 1.0709686279296875, 1.13409423828125, 1.1972198486328125, 1.260345458984375, 1.3234710693359375, 1.3865966796875, 1.4497222900390625, 1.512847900390625, 1.5759735107421875, 1.63909912109375, 1.7022247314453125, 1.765350341796875, 1.8284759521484375, 1.8916015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 5.0, 12.0, 16.0, 20.0, 10.0, 18.0, 17.0, 30.0, 22.0, 38.0, 53.0, 45.0, 33.0, 50.0, 52.0, 42.0, 51.0, 53.0, 48.0, 46.0, 41.0, 33.0, 36.0, 31.0, 40.0, 23.0, 15.0, 19.0, 29.0, 9.0, 7.0, 9.0, 10.0, 13.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.6053314208984375, -1.552459716796875, -1.4995880126953125, -1.44671630859375, -1.3938446044921875, -1.340972900390625, -1.2881011962890625, -1.2352294921875, -1.1823577880859375, -1.129486083984375, -1.0766143798828125, -1.02374267578125, -0.9708709716796875, -0.917999267578125, -0.8651275634765625, -0.812255859375, -0.7593841552734375, -0.706512451171875, -0.6536407470703125, -0.60076904296875, -0.5478973388671875, -0.495025634765625, -0.4421539306640625, -0.3892822265625, -0.3364105224609375, -0.283538818359375, -0.2306671142578125, -0.17779541015625, -0.1249237060546875, -0.072052001953125, -0.0191802978515625, 0.03369140625, 0.0865631103515625, 0.139434814453125, 0.1923065185546875, 0.24517822265625, 0.2980499267578125, 0.350921630859375, 0.4037933349609375, 0.4566650390625, 0.5095367431640625, 0.562408447265625, 0.6152801513671875, 0.66815185546875, 0.7210235595703125, 0.773895263671875, 0.8267669677734375, 0.879638671875, 0.9325103759765625, 0.985382080078125, 1.0382537841796875, 1.09112548828125, 1.1439971923828125, 1.196868896484375, 1.2497406005859375, 1.3026123046875, 1.3554840087890625, 1.408355712890625, 1.4612274169921875, 1.51409912109375, 1.5669708251953125, 1.619842529296875, 1.6727142333984375, 1.7255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 5.0, 8.0, 12.0, 14.0, 27.0, 39.0, 61.0, 94.0, 149.0, 170.0, 297.0, 458.0, 789.0, 1407.0, 2445.0, 4173.0, 7442.0, 14038.0, 27424.0, 63894.0, 170449.0, 338594.0, 243915.0, 94651.0, 37597.0, 18080.0, 9651.0, 5320.0, 3001.0, 1686.0, 1043.0, 592.0, 371.0, 229.0, 135.0, 88.0, 55.0, 38.0, 38.0, 30.0, 13.0, 9.0, 6.0, 7.0, 5.0, 7.0, 3.0, 1.0, 2.0], "bins": [-2.623046875, -2.55157470703125, -2.4801025390625, -2.40863037109375, -2.337158203125, -2.26568603515625, -2.1942138671875, -2.12274169921875, -2.05126953125, -1.97979736328125, -1.9083251953125, -1.83685302734375, -1.765380859375, -1.69390869140625, -1.6224365234375, -1.55096435546875, -1.4794921875, -1.40802001953125, -1.3365478515625, -1.26507568359375, -1.193603515625, -1.12213134765625, -1.0506591796875, -0.97918701171875, -0.90771484375, -0.83624267578125, -0.7647705078125, -0.69329833984375, -0.621826171875, -0.55035400390625, -0.4788818359375, -0.40740966796875, -0.3359375, -0.26446533203125, -0.1929931640625, -0.12152099609375, -0.050048828125, 0.02142333984375, 0.0928955078125, 0.16436767578125, 0.23583984375, 0.30731201171875, 0.3787841796875, 0.45025634765625, 0.521728515625, 0.59320068359375, 0.6646728515625, 0.73614501953125, 0.8076171875, 0.87908935546875, 0.9505615234375, 1.02203369140625, 1.093505859375, 1.16497802734375, 1.2364501953125, 1.30792236328125, 1.37939453125, 1.45086669921875, 1.5223388671875, 1.59381103515625, 1.665283203125, 1.73675537109375, 1.8082275390625, 1.87969970703125, 1.951171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 13.0, 13.0, 11.0, 23.0, 21.0, 30.0, 27.0, 24.0, 29.0, 26.0, 31.0, 37.0, 33.0, 29.0, 36.0, 37.0, 49.0, 50.0, 37.0, 39.0, 33.0, 30.0, 29.0, 41.0, 29.0, 22.0, 22.0, 20.0, 32.0, 20.0, 19.0, 11.0, 15.0, 10.0, 8.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.21875, -4.093963623046875, -3.96917724609375, -3.844390869140625, -3.7196044921875, -3.594818115234375, -3.47003173828125, -3.345245361328125, -3.220458984375, -3.095672607421875, -2.97088623046875, -2.846099853515625, -2.7213134765625, -2.596527099609375, -2.47174072265625, -2.346954345703125, -2.22216796875, -2.097381591796875, -1.97259521484375, -1.847808837890625, -1.7230224609375, -1.598236083984375, -1.47344970703125, -1.348663330078125, -1.223876953125, -1.099090576171875, -0.97430419921875, -0.849517822265625, -0.7247314453125, -0.599945068359375, -0.47515869140625, -0.350372314453125, -0.2255859375, -0.100799560546875, 0.02398681640625, 0.148773193359375, 0.2735595703125, 0.398345947265625, 0.52313232421875, 0.647918701171875, 0.772705078125, 0.897491455078125, 1.02227783203125, 1.147064208984375, 1.2718505859375, 1.396636962890625, 1.52142333984375, 1.646209716796875, 1.77099609375, 1.895782470703125, 2.02056884765625, 2.145355224609375, 2.2701416015625, 2.394927978515625, 2.51971435546875, 2.644500732421875, 2.769287109375, 2.894073486328125, 3.01885986328125, 3.143646240234375, 3.2684326171875, 3.393218994140625, 3.51800537109375, 3.642791748046875, 3.767578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 9.0, 15.0, 18.0, 13.0, 29.0, 34.0, 65.0, 104.0, 147.0, 241.0, 341.0, 567.0, 852.0, 1336.0, 1961.0, 3396.0, 5485.0, 8954.0, 15323.0, 26728.0, 47638.0, 89128.0, 163309.0, 235491.0, 196975.0, 111445.0, 59242.0, 32917.0, 18762.0, 10725.0, 6436.0, 3949.0, 2556.0, 1542.0, 981.0, 629.0, 402.0, 265.0, 172.0, 118.0, 81.0, 45.0, 32.0, 35.0, 16.0, 18.0, 12.0, 6.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7021484375, -0.6799850463867188, -0.6578216552734375, -0.6356582641601562, -0.613494873046875, -0.5913314819335938, -0.5691680908203125, -0.5470046997070312, -0.52484130859375, -0.5026779174804688, -0.4805145263671875, -0.45835113525390625, -0.436187744140625, -0.41402435302734375, -0.3918609619140625, -0.36969757080078125, -0.3475341796875, -0.32537078857421875, -0.3032073974609375, -0.28104400634765625, -0.258880615234375, -0.23671722412109375, -0.2145538330078125, -0.19239044189453125, -0.17022705078125, -0.14806365966796875, -0.1259002685546875, -0.10373687744140625, -0.081573486328125, -0.05941009521484375, -0.0372467041015625, -0.01508331298828125, 0.007080078125, 0.02924346923828125, 0.0514068603515625, 0.07357025146484375, 0.095733642578125, 0.11789703369140625, 0.1400604248046875, 0.16222381591796875, 0.18438720703125, 0.20655059814453125, 0.2287139892578125, 0.25087738037109375, 0.273040771484375, 0.29520416259765625, 0.3173675537109375, 0.33953094482421875, 0.3616943359375, 0.38385772705078125, 0.4060211181640625, 0.42818450927734375, 0.450347900390625, 0.47251129150390625, 0.4946746826171875, 0.5168380737304688, 0.53900146484375, 0.5611648559570312, 0.5833282470703125, 0.6054916381835938, 0.627655029296875, 0.6498184204101562, 0.6719818115234375, 0.6941452026367188, 0.71630859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 20.0, 25.0, 35.0, 56.0, 88.0, 104.0, 129.0, 145.0, 96.0, 82.0, 35.0, 37.0, 24.0, 19.0, 15.0, 8.0, 9.0, 7.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00032067298889160156, -0.0003102831542491913, -0.000299893319606781, -0.00028950348496437073, -0.00027911365032196045, -0.00026872381567955017, -0.0002583339810371399, -0.0002479441463947296, -0.00023755431175231934, -0.00022716447710990906, -0.00021677464246749878, -0.0002063848078250885, -0.00019599497318267822, -0.00018560513854026794, -0.00017521530389785767, -0.0001648254692554474, -0.0001544356346130371, -0.00014404579997062683, -0.00013365596532821655, -0.00012326613068580627, -0.000112876296043396, -0.00010248646140098572, -9.209662675857544e-05, -8.170679211616516e-05, -7.131695747375488e-05, -6.0927122831344604e-05, -5.0537288188934326e-05, -4.014745354652405e-05, -2.975761890411377e-05, -1.936778426170349e-05, -8.977949619293213e-06, 1.4118850231170654e-06, 1.1801719665527344e-05, 2.2191554307937622e-05, 3.25813889503479e-05, 4.297122359275818e-05, 5.336105823516846e-05, 6.375089287757874e-05, 7.414072751998901e-05, 8.453056216239929e-05, 9.492039680480957e-05, 0.00010531023144721985, 0.00011570006608963013, 0.0001260899007320404, 0.00013647973537445068, 0.00014686957001686096, 0.00015725940465927124, 0.00016764923930168152, 0.0001780390739440918, 0.00018842890858650208, 0.00019881874322891235, 0.00020920857787132263, 0.0002195984125137329, 0.0002299882471561432, 0.00024037808179855347, 0.00025076791644096375, 0.000261157751083374, 0.0002715475857257843, 0.0002819374203681946, 0.00029232725501060486, 0.00030271708965301514, 0.0003131069242954254, 0.0003234967589378357, 0.00033388659358024597, 0.00034427642822265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 10.0, 4.0, 12.0, 14.0, 25.0, 36.0, 58.0, 104.0, 150.0, 237.0, 367.0, 608.0, 1012.0, 1767.0, 3138.0, 5514.0, 10002.0, 18346.0, 34348.0, 65574.0, 124398.0, 203298.0, 227634.0, 161097.0, 88826.0, 47006.0, 24732.0, 13290.0, 7326.0, 4055.0, 2213.0, 1334.0, 758.0, 494.0, 280.0, 182.0, 90.0, 73.0, 48.0, 42.0, 14.0, 17.0, 8.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7470779418945312, -0.7231597900390625, -0.6992416381835938, -0.675323486328125, -0.6514053344726562, -0.6274871826171875, -0.6035690307617188, -0.57965087890625, -0.5557327270507812, -0.5318145751953125, -0.5078964233398438, -0.483978271484375, -0.46006011962890625, -0.4361419677734375, -0.41222381591796875, -0.3883056640625, -0.36438751220703125, -0.3404693603515625, -0.31655120849609375, -0.292633056640625, -0.26871490478515625, -0.2447967529296875, -0.22087860107421875, -0.19696044921875, -0.17304229736328125, -0.1491241455078125, -0.12520599365234375, -0.101287841796875, -0.07736968994140625, -0.0534515380859375, -0.02953338623046875, -0.005615234375, 0.01830291748046875, 0.0422210693359375, 0.06613922119140625, 0.090057373046875, 0.11397552490234375, 0.1378936767578125, 0.16181182861328125, 0.18572998046875, 0.20964813232421875, 0.2335662841796875, 0.25748443603515625, 0.281402587890625, 0.30532073974609375, 0.3292388916015625, 0.35315704345703125, 0.3770751953125, 0.40099334716796875, 0.4249114990234375, 0.44882965087890625, 0.472747802734375, 0.49666595458984375, 0.5205841064453125, 0.5445022583007812, 0.56842041015625, 0.5923385620117188, 0.6162567138671875, 0.6401748657226562, 0.664093017578125, 0.6880111694335938, 0.7119293212890625, 0.7358474731445312, 0.759765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 3.0, 4.0, 8.0, 9.0, 13.0, 10.0, 14.0, 12.0, 16.0, 18.0, 23.0, 45.0, 41.0, 53.0, 52.0, 53.0, 69.0, 74.0, 68.0, 59.0, 51.0, 50.0, 52.0, 41.0, 31.0, 19.0, 14.0, 16.0, 18.0, 11.0, 8.0, 9.0, 6.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.267578125, -1.2347640991210938, -1.2019500732421875, -1.1691360473632812, -1.136322021484375, -1.1035079956054688, -1.0706939697265625, -1.0378799438476562, -1.00506591796875, -0.9722518920898438, -0.9394378662109375, -0.9066238403320312, -0.873809814453125, -0.8409957885742188, -0.8081817626953125, -0.7753677368164062, -0.7425537109375, -0.7097396850585938, -0.6769256591796875, -0.6441116333007812, -0.611297607421875, -0.5784835815429688, -0.5456695556640625, -0.5128555297851562, -0.48004150390625, -0.44722747802734375, -0.4144134521484375, -0.38159942626953125, -0.348785400390625, -0.31597137451171875, -0.2831573486328125, -0.25034332275390625, -0.217529296875, -0.18471527099609375, -0.1519012451171875, -0.11908721923828125, -0.086273193359375, -0.05345916748046875, -0.0206451416015625, 0.01216888427734375, 0.04498291015625, 0.07779693603515625, 0.1106109619140625, 0.14342498779296875, 0.176239013671875, 0.20905303955078125, 0.2418670654296875, 0.27468109130859375, 0.3074951171875, 0.34030914306640625, 0.3731231689453125, 0.40593719482421875, 0.438751220703125, 0.47156524658203125, 0.5043792724609375, 0.5371932983398438, 0.57000732421875, 0.6028213500976562, 0.6356353759765625, 0.6684494018554688, 0.701263427734375, 0.7340774536132812, 0.7668914794921875, 0.7997055053710938, 0.83251953125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 9.0, 19.0, 39.0, 81.0, 130.0, 149.0, 200.0, 156.0, 122.0, 51.0, 26.0, 11.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.805679321289062, -15.066817283630371, -14.32795524597168, -13.589094161987305, -12.850232124328613, -12.111370086669922, -11.372509002685547, -10.633646965026855, -9.894784927368164, -9.155922889709473, -8.417060852050781, -7.678199768066406, -6.939337730407715, -6.200475692749023, -5.46161413192749, -4.722752571105957, -3.9838905334472656, -3.2450287342071533, -2.506166934967041, -1.7673051357269287, -1.0284433364868164, -0.2895815372467041, 0.4492802619934082, 1.1881418228149414, 1.9270038604736328, 2.665865659713745, 3.4047274589538574, 4.143589019775391, 4.882451057434082, 5.621313095092773, 6.360174655914307, 7.09903621673584, 7.837896347045898, 8.57675838470459, 9.315620422363281, 10.054481506347656, 10.793343544006348, 11.532205581665039, 12.271066665649414, 13.009928703308105, 13.748790740966797, 14.487652778625488, 15.22651481628418, 15.965375900268555, 16.704238891601562, 17.443099975585938, 18.181961059570312, 18.920822143554688, 19.659685134887695, 20.39854621887207, 21.137409210205078, 21.876270294189453, 22.615131378173828, 23.353994369506836, 24.09285545349121, 24.83171844482422, 25.570579528808594, 26.30944061279297, 27.048303604125977, 27.78716468811035, 28.52602767944336, 29.264888763427734, 30.00374984741211, 30.742610931396484, 31.481473922729492]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 13.0, 13.0, 12.0, 22.0, 20.0, 25.0, 24.0, 45.0, 28.0, 30.0, 39.0, 43.0, 33.0, 40.0, 40.0, 36.0, 40.0, 36.0, 36.0, 40.0, 36.0, 42.0, 34.0, 28.0, 32.0, 26.0, 30.0, 23.0, 14.0, 17.0, 16.0, 16.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.92996597290039, -12.569768905639648, -12.209572792053223, -11.84937572479248, -11.489179611206055, -11.128982543945312, -10.76878547668457, -10.408589363098145, -10.048393249511719, -9.688196182250977, -9.32800006866455, -8.967803001403809, -8.607606887817383, -8.24740982055664, -7.887213230133057, -7.527016639709473, -7.1668195724487305, -6.8066229820251465, -6.4464263916015625, -6.08622932434082, -5.7260332107543945, -5.365836143493652, -5.005639553070068, -4.645442962646484, -4.2852463722229, -3.9250497817993164, -3.5648531913757324, -3.2046563625335693, -2.8444597721099854, -2.4842631816864014, -2.1240663528442383, -1.7638697624206543, -1.403672218322754, -1.04347562789917, -0.6832789182662964, -0.32308220863342285, 0.03711438179016113, 0.3973109722137451, 0.7575078010559082, 1.1177043914794922, 1.4779009819030762, 1.8380975723266602, 2.198294162750244, 2.5584909915924072, 2.918687582015991, 3.278884172439575, 3.6390810012817383, 3.9992775917053223, 4.359474182128906, 4.71967077255249, 5.079867362976074, 5.440064430236816, 5.800260543823242, 6.160457611083984, 6.520654201507568, 6.880850791931152, 7.241047382354736, 7.60124397277832, 7.961440563201904, 8.321637153625488, 8.68183422088623, 9.042030334472656, 9.402227401733398, 9.76242446899414, 10.122620582580566]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 13.0, 12.0, 13.0, 26.0, 25.0, 47.0, 75.0, 89.0, 156.0, 235.0, 361.0, 607.0, 1034.0, 2019.0, 3895.0, 7796.0, 17077.0, 41305.0, 109771.0, 348469.0, 1485683.0, 1603979.0, 375192.0, 117300.0, 43801.0, 18271.0, 8307.0, 3971.0, 2004.0, 1132.0, 610.0, 366.0, 233.0, 135.0, 82.0, 58.0, 46.0, 29.0, 21.0, 13.0, 8.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.928131103515625, -2.84454345703125, -2.760955810546875, -2.6773681640625, -2.593780517578125, -2.51019287109375, -2.426605224609375, -2.343017578125, -2.259429931640625, -2.17584228515625, -2.092254638671875, -2.0086669921875, -1.925079345703125, -1.84149169921875, -1.757904052734375, -1.67431640625, -1.590728759765625, -1.50714111328125, -1.423553466796875, -1.3399658203125, -1.256378173828125, -1.17279052734375, -1.089202880859375, -1.005615234375, -0.922027587890625, -0.83843994140625, -0.754852294921875, -0.6712646484375, -0.587677001953125, -0.50408935546875, -0.420501708984375, -0.3369140625, -0.253326416015625, -0.16973876953125, -0.086151123046875, -0.0025634765625, 0.081024169921875, 0.16461181640625, 0.248199462890625, 0.331787109375, 0.415374755859375, 0.49896240234375, 0.582550048828125, 0.6661376953125, 0.749725341796875, 0.83331298828125, 0.916900634765625, 1.00048828125, 1.084075927734375, 1.16766357421875, 1.251251220703125, 1.3348388671875, 1.418426513671875, 1.50201416015625, 1.585601806640625, 1.669189453125, 1.752777099609375, 1.83636474609375, 1.919952392578125, 2.0035400390625, 2.087127685546875, 2.17071533203125, 2.254302978515625, 2.337890625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 7.0, 8.0, 10.0, 12.0, 7.0, 16.0, 16.0, 18.0, 18.0, 23.0, 33.0, 31.0, 33.0, 37.0, 43.0, 45.0, 48.0, 49.0, 40.0, 35.0, 41.0, 38.0, 39.0, 34.0, 45.0, 32.0, 30.0, 28.0, 28.0, 21.0, 15.0, 19.0, 17.0, 13.0, 9.0, 12.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.34375, -1.29754638671875, -1.2513427734375, -1.20513916015625, -1.158935546875, -1.11273193359375, -1.0665283203125, -1.02032470703125, -0.97412109375, -0.92791748046875, -0.8817138671875, -0.83551025390625, -0.789306640625, -0.74310302734375, -0.6968994140625, -0.65069580078125, -0.6044921875, -0.55828857421875, -0.5120849609375, -0.46588134765625, -0.419677734375, -0.37347412109375, -0.3272705078125, -0.28106689453125, -0.23486328125, -0.18865966796875, -0.1424560546875, -0.09625244140625, -0.050048828125, -0.00384521484375, 0.0423583984375, 0.08856201171875, 0.134765625, 0.18096923828125, 0.2271728515625, 0.27337646484375, 0.319580078125, 0.36578369140625, 0.4119873046875, 0.45819091796875, 0.50439453125, 0.55059814453125, 0.5968017578125, 0.64300537109375, 0.689208984375, 0.73541259765625, 0.7816162109375, 0.82781982421875, 0.8740234375, 0.92022705078125, 0.9664306640625, 1.01263427734375, 1.058837890625, 1.10504150390625, 1.1512451171875, 1.19744873046875, 1.24365234375, 1.28985595703125, 1.3360595703125, 1.38226318359375, 1.428466796875, 1.47467041015625, 1.5208740234375, 1.56707763671875, 1.61328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 8.0, 10.0, 22.0, 18.0, 32.0, 44.0, 81.0, 151.0, 247.0, 483.0, 1125.0, 2731.0, 7923.0, 25051.0, 95344.0, 464482.0, 2740272.0, 683070.0, 125355.0, 32117.0, 9688.0, 3428.0, 1348.0, 548.0, 292.0, 169.0, 74.0, 51.0, 42.0, 24.0, 17.0, 11.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.81640625, -3.67291259765625, -3.5294189453125, -3.38592529296875, -3.242431640625, -3.09893798828125, -2.9554443359375, -2.81195068359375, -2.66845703125, -2.52496337890625, -2.3814697265625, -2.23797607421875, -2.094482421875, -1.95098876953125, -1.8074951171875, -1.66400146484375, -1.5205078125, -1.37701416015625, -1.2335205078125, -1.09002685546875, -0.946533203125, -0.80303955078125, -0.6595458984375, -0.51605224609375, -0.37255859375, -0.22906494140625, -0.0855712890625, 0.05792236328125, 0.201416015625, 0.34490966796875, 0.4884033203125, 0.63189697265625, 0.775390625, 0.91888427734375, 1.0623779296875, 1.20587158203125, 1.349365234375, 1.49285888671875, 1.6363525390625, 1.77984619140625, 1.92333984375, 2.06683349609375, 2.2103271484375, 2.35382080078125, 2.497314453125, 2.64080810546875, 2.7843017578125, 2.92779541015625, 3.0712890625, 3.21478271484375, 3.3582763671875, 3.50177001953125, 3.645263671875, 3.78875732421875, 3.9322509765625, 4.07574462890625, 4.21923828125, 4.36273193359375, 4.5062255859375, 4.64971923828125, 4.793212890625, 4.93670654296875, 5.0802001953125, 5.22369384765625, 5.3671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 12.0, 8.0, 11.0, 13.0, 24.0, 31.0, 47.0, 64.0, 83.0, 142.0, 170.0, 302.0, 477.0, 763.0, 701.0, 416.0, 246.0, 172.0, 107.0, 80.0, 44.0, 53.0, 30.0, 24.0, 18.0, 9.0, 8.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.7503662109375, -4.610107421875, -4.4698486328125, -4.32958984375, -4.1893310546875, -4.049072265625, -3.9088134765625, -3.7685546875, -3.6282958984375, -3.488037109375, -3.3477783203125, -3.20751953125, -3.0672607421875, -2.927001953125, -2.7867431640625, -2.646484375, -2.5062255859375, -2.365966796875, -2.2257080078125, -2.08544921875, -1.9451904296875, -1.804931640625, -1.6646728515625, -1.5244140625, -1.3841552734375, -1.243896484375, -1.1036376953125, -0.96337890625, -0.8231201171875, -0.682861328125, -0.5426025390625, -0.40234375, -0.2620849609375, -0.121826171875, 0.0184326171875, 0.15869140625, 0.2989501953125, 0.439208984375, 0.5794677734375, 0.7197265625, 0.8599853515625, 1.000244140625, 1.1405029296875, 1.28076171875, 1.4210205078125, 1.561279296875, 1.7015380859375, 1.841796875, 1.9820556640625, 2.122314453125, 2.2625732421875, 2.40283203125, 2.5430908203125, 2.683349609375, 2.8236083984375, 2.9638671875, 3.1041259765625, 3.244384765625, 3.3846435546875, 3.52490234375, 3.6651611328125, 3.805419921875, 3.9456787109375, 4.0859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 13.0, 7.0, 9.0, 22.0, 45.0, 67.0, 71.0, 107.0, 137.0, 142.0, 111.0, 94.0, 68.0, 47.0, 20.0, 18.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.525554656982422, -14.800288200378418, -14.075021743774414, -13.349756240844727, -12.624488830566406, -11.899223327636719, -11.173956871032715, -10.448690414428711, -9.723423957824707, -8.998157501220703, -8.2728910446167, -7.5476250648498535, -6.82235860824585, -6.097092151641846, -5.371826171875, -4.646559715270996, -3.921293258666992, -3.1960268020629883, -2.4707605838775635, -1.7454943656921387, -1.0202279090881348, -0.29496145248413086, 0.43030452728271484, 1.1555709838867188, 1.8808374404907227, 2.6061038970947266, 3.3313701152801514, 4.056636333465576, 4.78190279006958, 5.507169246673584, 6.23243522644043, 6.957701683044434, 7.68297004699707, 8.408236503601074, 9.133502960205078, 9.858768463134766, 10.584035873413086, 11.309301376342773, 12.034567832946777, 12.759834289550781, 13.485100746154785, 14.210367202758789, 14.935633659362793, 15.660900115966797, 16.386165618896484, 17.111433029174805, 17.836698532104492, 18.561965942382812, 19.2872314453125, 20.012496948242188, 20.737764358520508, 21.463029861450195, 22.188297271728516, 22.913562774658203, 23.63882827758789, 24.36409568786621, 25.08936309814453, 25.81462860107422, 26.53989601135254, 27.265161514282227, 27.990428924560547, 28.715694427490234, 29.440959930419922, 30.166227340698242, 30.89149284362793]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 1.0, 7.0, 2.0, 5.0, 9.0, 17.0, 20.0, 19.0, 22.0, 23.0, 23.0, 26.0, 22.0, 24.0, 29.0, 45.0, 34.0, 38.0, 40.0, 39.0, 36.0, 37.0, 42.0, 37.0, 39.0, 30.0, 31.0, 25.0, 33.0, 28.0, 26.0, 23.0, 19.0, 21.0, 14.0, 19.0, 19.0, 13.0, 10.0, 8.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.159262657165527, -9.850515365600586, -9.541768074035645, -9.233020782470703, -8.924274444580078, -8.615527153015137, -8.306779861450195, -7.998032569885254, -7.6892852783203125, -7.380537986755371, -7.07179069519043, -6.7630438804626465, -6.454296588897705, -6.145549297332764, -5.8368024826049805, -5.528055191040039, -5.219307899475098, -4.910560607910156, -4.601813316345215, -4.293066501617432, -3.9843192100524902, -3.675571918487549, -3.3668248653411865, -3.058077812194824, -2.749330520629883, -2.4405832290649414, -2.131836175918579, -1.8230890035629272, -1.5143418312072754, -1.2055946588516235, -0.8968474864959717, -0.5881004333496094, -0.2793540954589844, 0.02939307689666748, 0.33814024925231934, 0.6468874216079712, 0.955634593963623, 1.264381766319275, 1.5731289386749268, 1.881875991821289, 2.1906232833862305, 2.499370574951172, 2.808117628097534, 3.1168646812438965, 3.425611972808838, 3.7343592643737793, 4.0431060791015625, 4.351853370666504, 4.660600662231445, 4.969347953796387, 5.278095245361328, 5.586842060089111, 5.895589351654053, 6.204336643218994, 6.513083457946777, 6.821830749511719, 7.13057804107666, 7.439325332641602, 7.748072624206543, 8.056819915771484, 8.36556625366211, 8.67431354522705, 8.983060836791992, 9.291808128356934, 9.600555419921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 3.0, 7.0, 10.0, 15.0, 26.0, 43.0, 64.0, 67.0, 129.0, 196.0, 314.0, 448.0, 617.0, 970.0, 1397.0, 2156.0, 3194.0, 4472.0, 6823.0, 10706.0, 18168.0, 37653.0, 111625.0, 376851.0, 309672.0, 86102.0, 31834.0, 16093.0, 9536.0, 6386.0, 4186.0, 2820.0, 1955.0, 1338.0, 923.0, 575.0, 372.0, 252.0, 155.0, 134.0, 95.0, 55.0, 41.0, 20.0, 16.0, 8.0, 12.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.181640625, -3.0877685546875, -2.993896484375, -2.9000244140625, -2.80615234375, -2.7122802734375, -2.618408203125, -2.5245361328125, -2.4306640625, -2.3367919921875, -2.242919921875, -2.1490478515625, -2.05517578125, -1.9613037109375, -1.867431640625, -1.7735595703125, -1.6796875, -1.5858154296875, -1.491943359375, -1.3980712890625, -1.30419921875, -1.2103271484375, -1.116455078125, -1.0225830078125, -0.9287109375, -0.8348388671875, -0.740966796875, -0.6470947265625, -0.55322265625, -0.4593505859375, -0.365478515625, -0.2716064453125, -0.177734375, -0.0838623046875, 0.010009765625, 0.1038818359375, 0.19775390625, 0.2916259765625, 0.385498046875, 0.4793701171875, 0.5732421875, 0.6671142578125, 0.760986328125, 0.8548583984375, 0.94873046875, 1.0426025390625, 1.136474609375, 1.2303466796875, 1.32421875, 1.4180908203125, 1.511962890625, 1.6058349609375, 1.69970703125, 1.7935791015625, 1.887451171875, 1.9813232421875, 2.0751953125, 2.1690673828125, 2.262939453125, 2.3568115234375, 2.45068359375, 2.5445556640625, 2.638427734375, 2.7322998046875, 2.826171875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 8.0, 7.0, 8.0, 12.0, 5.0, 13.0, 16.0, 11.0, 13.0, 14.0, 27.0, 24.0, 23.0, 34.0, 24.0, 38.0, 32.0, 27.0, 33.0, 50.0, 38.0, 38.0, 26.0, 41.0, 34.0, 36.0, 39.0, 28.0, 37.0, 23.0, 27.0, 18.0, 22.0, 18.0, 19.0, 15.0, 15.0, 14.0, 10.0, 12.0, 11.0, 11.0, 11.0, 2.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.3798828125, -1.3389739990234375, -1.298065185546875, -1.2571563720703125, -1.21624755859375, -1.1753387451171875, -1.134429931640625, -1.0935211181640625, -1.0526123046875, -1.0117034912109375, -0.970794677734375, -0.9298858642578125, -0.88897705078125, -0.8480682373046875, -0.807159423828125, -0.7662506103515625, -0.725341796875, -0.6844329833984375, -0.643524169921875, -0.6026153564453125, -0.56170654296875, -0.5207977294921875, -0.479888916015625, -0.4389801025390625, -0.3980712890625, -0.3571624755859375, -0.316253662109375, -0.2753448486328125, -0.23443603515625, -0.1935272216796875, -0.152618408203125, -0.1117095947265625, -0.07080078125, -0.0298919677734375, 0.011016845703125, 0.0519256591796875, 0.09283447265625, 0.1337432861328125, 0.174652099609375, 0.2155609130859375, 0.2564697265625, 0.2973785400390625, 0.338287353515625, 0.3791961669921875, 0.42010498046875, 0.4610137939453125, 0.501922607421875, 0.5428314208984375, 0.583740234375, 0.6246490478515625, 0.665557861328125, 0.7064666748046875, 0.74737548828125, 0.7882843017578125, 0.829193115234375, 0.8701019287109375, 0.9110107421875, 0.9519195556640625, 0.992828369140625, 1.0337371826171875, 1.07464599609375, 1.1155548095703125, 1.156463623046875, 1.1973724365234375, 1.23828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 10.0, 9.0, 19.0, 30.0, 42.0, 63.0, 79.0, 149.0, 220.0, 378.0, 717.0, 1375.0, 2864.0, 6000.0, 13243.0, 29523.0, 83043.0, 395119.0, 382166.0, 79717.0, 28880.0, 12945.0, 5974.0, 2817.0, 1428.0, 715.0, 386.0, 237.0, 128.0, 74.0, 60.0, 42.0, 27.0, 23.0, 16.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40625, -3.280029296875, -3.15380859375, -3.027587890625, -2.9013671875, -2.775146484375, -2.64892578125, -2.522705078125, -2.396484375, -2.270263671875, -2.14404296875, -2.017822265625, -1.8916015625, -1.765380859375, -1.63916015625, -1.512939453125, -1.38671875, -1.260498046875, -1.13427734375, -1.008056640625, -0.8818359375, -0.755615234375, -0.62939453125, -0.503173828125, -0.376953125, -0.250732421875, -0.12451171875, 0.001708984375, 0.1279296875, 0.254150390625, 0.38037109375, 0.506591796875, 0.6328125, 0.759033203125, 0.88525390625, 1.011474609375, 1.1376953125, 1.263916015625, 1.39013671875, 1.516357421875, 1.642578125, 1.768798828125, 1.89501953125, 2.021240234375, 2.1474609375, 2.273681640625, 2.39990234375, 2.526123046875, 2.65234375, 2.778564453125, 2.90478515625, 3.031005859375, 3.1572265625, 3.283447265625, 3.40966796875, 3.535888671875, 3.662109375, 3.788330078125, 3.91455078125, 4.040771484375, 4.1669921875, 4.293212890625, 4.41943359375, 4.545654296875, 4.671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 6.0, 6.0, 9.0, 19.0, 17.0, 30.0, 37.0, 34.0, 48.0, 52.0, 49.0, 53.0, 74.0, 49.0, 78.0, 54.0, 58.0, 62.0, 39.0, 51.0, 21.0, 29.0, 24.0, 21.0, 19.0, 9.0, 10.0, 3.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.53778076171875, -5.3372802734375, -5.13677978515625, -4.936279296875, -4.73577880859375, -4.5352783203125, -4.33477783203125, -4.13427734375, -3.93377685546875, -3.7332763671875, -3.53277587890625, -3.332275390625, -3.13177490234375, -2.9312744140625, -2.73077392578125, -2.5302734375, -2.32977294921875, -2.1292724609375, -1.92877197265625, -1.728271484375, -1.52777099609375, -1.3272705078125, -1.12677001953125, -0.92626953125, -0.72576904296875, -0.5252685546875, -0.32476806640625, -0.124267578125, 0.07623291015625, 0.2767333984375, 0.47723388671875, 0.677734375, 0.87823486328125, 1.0787353515625, 1.27923583984375, 1.479736328125, 1.68023681640625, 1.8807373046875, 2.08123779296875, 2.28173828125, 2.48223876953125, 2.6827392578125, 2.88323974609375, 3.083740234375, 3.28424072265625, 3.4847412109375, 3.68524169921875, 3.8857421875, 4.08624267578125, 4.2867431640625, 4.48724365234375, 4.687744140625, 4.88824462890625, 5.0887451171875, 5.28924560546875, 5.48974609375, 5.69024658203125, 5.8907470703125, 6.09124755859375, 6.291748046875, 6.49224853515625, 6.6927490234375, 6.89324951171875, 7.09375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 6.0, 8.0, 20.0, 37.0, 33.0, 44.0, 60.0, 111.0, 194.0, 278.0, 432.0, 653.0, 1047.0, 1688.0, 2746.0, 4528.0, 7573.0, 13370.0, 26115.0, 56227.0, 141695.0, 333048.0, 266794.0, 101290.0, 42735.0, 20580.0, 10861.0, 6246.0, 3650.0, 2388.0, 1484.0, 960.0, 548.0, 375.0, 220.0, 157.0, 97.0, 61.0, 47.0, 45.0, 30.0, 17.0, 15.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.0869140625, -1.052764892578125, -1.01861572265625, -0.984466552734375, -0.9503173828125, -0.916168212890625, -0.88201904296875, -0.847869873046875, -0.813720703125, -0.779571533203125, -0.74542236328125, -0.711273193359375, -0.6771240234375, -0.642974853515625, -0.60882568359375, -0.574676513671875, -0.54052734375, -0.506378173828125, -0.47222900390625, -0.438079833984375, -0.4039306640625, -0.369781494140625, -0.33563232421875, -0.301483154296875, -0.267333984375, -0.233184814453125, -0.19903564453125, -0.164886474609375, -0.1307373046875, -0.096588134765625, -0.06243896484375, -0.028289794921875, 0.005859375, 0.040008544921875, 0.07415771484375, 0.108306884765625, 0.1424560546875, 0.176605224609375, 0.21075439453125, 0.244903564453125, 0.279052734375, 0.313201904296875, 0.34735107421875, 0.381500244140625, 0.4156494140625, 0.449798583984375, 0.48394775390625, 0.518096923828125, 0.55224609375, 0.586395263671875, 0.62054443359375, 0.654693603515625, 0.6888427734375, 0.722991943359375, 0.75714111328125, 0.791290283203125, 0.825439453125, 0.859588623046875, 0.89373779296875, 0.927886962890625, 0.9620361328125, 0.996185302734375, 1.03033447265625, 1.064483642578125, 1.0986328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 10.0, 13.0, 36.0, 59.0, 110.0, 223.0, 228.0, 125.0, 77.0, 22.0, 22.0, 19.0, 6.0, 5.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00069427490234375, -0.0006726160645484924, -0.0006509572267532349, -0.0006292983889579773, -0.0006076395511627197, -0.0005859807133674622, -0.0005643218755722046, -0.000542663037776947, -0.0005210041999816895, -0.0004993453621864319, -0.0004776865243911743, -0.00045602768659591675, -0.0004343688488006592, -0.0004127100110054016, -0.00039105117321014404, -0.0003693923354148865, -0.0003477334976196289, -0.00032607465982437134, -0.00030441582202911377, -0.0002827569842338562, -0.00026109814643859863, -0.00023943930864334106, -0.0002177804708480835, -0.00019612163305282593, -0.00017446279525756836, -0.0001528039574623108, -0.00013114511966705322, -0.00010948628187179565, -8.782744407653809e-05, -6.616860628128052e-05, -4.450976848602295e-05, -2.285093069076538e-05, -1.1920928955078125e-06, 2.0466744899749756e-05, 4.2125582695007324e-05, 6.378442049026489e-05, 8.544325828552246e-05, 0.00010710209608078003, 0.0001287609338760376, 0.00015041977167129517, 0.00017207860946655273, 0.0001937374472618103, 0.00021539628505706787, 0.00023705512285232544, 0.000258713960647583, 0.0002803727984428406, 0.00030203163623809814, 0.0003236904740333557, 0.0003453493118286133, 0.00036700814962387085, 0.0003886669874191284, 0.000410325825214386, 0.00043198466300964355, 0.0004536435008049011, 0.0004753023386001587, 0.0004969611763954163, 0.0005186200141906738, 0.0005402788519859314, 0.000561937689781189, 0.0005835965275764465, 0.0006052553653717041, 0.0006269142031669617, 0.0006485730409622192, 0.0006702318787574768, 0.0006918907165527344]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 9.0, 6.0, 14.0, 17.0, 29.0, 49.0, 45.0, 74.0, 110.0, 140.0, 242.0, 368.0, 626.0, 1128.0, 1829.0, 3331.0, 6019.0, 11423.0, 23853.0, 53577.0, 130219.0, 271104.0, 286713.0, 144678.0, 59274.0, 26030.0, 12622.0, 6485.0, 3634.0, 1982.0, 1097.0, 646.0, 397.0, 256.0, 180.0, 107.0, 80.0, 45.0, 27.0, 27.0, 17.0, 14.0, 13.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.873046875, -0.8419342041015625, -0.810821533203125, -0.7797088623046875, -0.74859619140625, -0.7174835205078125, -0.686370849609375, -0.6552581787109375, -0.6241455078125, -0.5930328369140625, -0.561920166015625, -0.5308074951171875, -0.49969482421875, -0.4685821533203125, -0.437469482421875, -0.4063568115234375, -0.375244140625, -0.3441314697265625, -0.313018798828125, -0.2819061279296875, -0.25079345703125, -0.2196807861328125, -0.188568115234375, -0.1574554443359375, -0.1263427734375, -0.0952301025390625, -0.064117431640625, -0.0330047607421875, -0.00189208984375, 0.0292205810546875, 0.060333251953125, 0.0914459228515625, 0.12255859375, 0.1536712646484375, 0.184783935546875, 0.2158966064453125, 0.24700927734375, 0.2781219482421875, 0.309234619140625, 0.3403472900390625, 0.3714599609375, 0.4025726318359375, 0.433685302734375, 0.4647979736328125, 0.49591064453125, 0.5270233154296875, 0.558135986328125, 0.5892486572265625, 0.620361328125, 0.6514739990234375, 0.682586669921875, 0.7136993408203125, 0.74481201171875, 0.7759246826171875, 0.807037353515625, 0.8381500244140625, 0.8692626953125, 0.9003753662109375, 0.931488037109375, 0.9626007080078125, 0.99371337890625, 1.0248260498046875, 1.055938720703125, 1.0870513916015625, 1.1181640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 13.0, 9.0, 19.0, 18.0, 23.0, 25.0, 17.0, 24.0, 33.0, 40.0, 62.0, 56.0, 62.0, 54.0, 71.0, 55.0, 54.0, 54.0, 47.0, 44.0, 37.0, 30.0, 22.0, 19.0, 19.0, 17.0, 9.0, 3.0, 6.0, 4.0, 2.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97412109375, -0.9378738403320312, -0.9016265869140625, -0.8653793334960938, -0.829132080078125, -0.7928848266601562, -0.7566375732421875, -0.7203903198242188, -0.68414306640625, -0.6478958129882812, -0.6116485595703125, -0.5754013061523438, -0.539154052734375, -0.5029067993164062, -0.4666595458984375, -0.43041229248046875, -0.3941650390625, -0.35791778564453125, -0.3216705322265625, -0.28542327880859375, -0.249176025390625, -0.21292877197265625, -0.1766815185546875, -0.14043426513671875, -0.10418701171875, -0.06793975830078125, -0.0316925048828125, 0.00455474853515625, 0.040802001953125, 0.07704925537109375, 0.1132965087890625, 0.14954376220703125, 0.185791015625, 0.22203826904296875, 0.2582855224609375, 0.29453277587890625, 0.330780029296875, 0.36702728271484375, 0.4032745361328125, 0.43952178955078125, 0.47576904296875, 0.5120162963867188, 0.5482635498046875, 0.5845108032226562, 0.620758056640625, 0.6570053100585938, 0.6932525634765625, 0.7294998168945312, 0.7657470703125, 0.8019943237304688, 0.8382415771484375, 0.8744888305664062, 0.910736083984375, 0.9469833374023438, 0.9832305908203125, 1.0194778442382812, 1.05572509765625, 1.0919723510742188, 1.1282196044921875, 1.1644668579101562, 1.200714111328125, 1.2369613647460938, 1.2732086181640625, 1.3094558715820312, 1.345703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 16.0, 55.0, 119.0, 256.0, 295.0, 175.0, 54.0, 18.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-56.889137268066406, -55.46892166137695, -54.048709869384766, -52.62849426269531, -51.208282470703125, -49.78806686401367, -48.36785125732422, -46.94763946533203, -45.52742385864258, -44.107208251953125, -42.68699645996094, -41.266780853271484, -39.84656524658203, -38.426353454589844, -37.00613784790039, -35.58592224121094, -34.16571044921875, -32.7454948425293, -31.32528305053711, -29.905067443847656, -28.484853744506836, -27.064640045166016, -25.644424438476562, -24.224210739135742, -22.803997039794922, -21.3837833404541, -19.96356964111328, -18.543354034423828, -17.123140335083008, -15.702926635742188, -14.28271198272705, -12.862497329711914, -11.442279815673828, -10.022066116333008, -8.601851463317871, -7.181637287139893, -5.761423110961914, -4.3412089347839355, -2.920994758605957, -1.5007801055908203, -0.08056640625, 1.3396477699279785, 2.759861946105957, 4.1800761222839355, 5.600290298461914, 7.020504474639893, 8.440718650817871, 9.860933303833008, 11.281147003173828, 12.701360702514648, 14.121575355529785, 15.541790008544922, 16.962003707885742, 18.382217407226562, 19.802433013916016, 21.222646713256836, 22.642860412597656, 24.063074111938477, 25.483287811279297, 26.90350341796875, 28.32371711730957, 29.74393081665039, 31.164146423339844, 32.58435821533203, 34.004573822021484]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 7.0, 5.0, 14.0, 13.0, 14.0, 20.0, 18.0, 27.0, 23.0, 40.0, 29.0, 35.0, 41.0, 32.0, 45.0, 40.0, 46.0, 33.0, 34.0, 47.0, 40.0, 42.0, 39.0, 37.0, 33.0, 34.0, 28.0, 30.0, 23.0, 23.0, 12.0, 18.0, 13.0, 10.0, 11.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.129358291625977, -11.744454383850098, -11.359551429748535, -10.974647521972656, -10.589743614196777, -10.204839706420898, -9.819936752319336, -9.435032844543457, -9.050128936767578, -8.6652250289917, -8.280322074890137, -7.895418167114258, -7.510514259338379, -7.125610828399658, -6.7407073974609375, -6.355803489685059, -5.970900058746338, -5.585996627807617, -5.201092720031738, -4.816189289093018, -4.431285381317139, -4.046381950378418, -3.661478281021118, -3.2765746116638184, -2.8916709423065186, -2.5067672729492188, -2.121863603591919, -1.7369600534439087, -1.3520563840866089, -0.9671527147293091, -0.5822491645812988, -0.19734549522399902, 0.18755817413330078, 0.5724618434906006, 0.9573654532432556, 1.3422690629959106, 1.7271727323532104, 2.1120762825012207, 2.4969799518585205, 2.8818836212158203, 3.26678729057312, 3.65169095993042, 4.036594390869141, 4.4214982986450195, 4.80640172958374, 5.191305637359619, 5.57620906829834, 5.961112976074219, 6.3460164070129395, 6.73091983795166, 7.115823745727539, 7.50072717666626, 7.885631084442139, 8.27053451538086, 8.655438423156738, 9.040342330932617, 9.42524528503418, 9.810149192810059, 10.195052146911621, 10.5799560546875, 10.964859962463379, 11.349763870239258, 11.73466682434082, 12.1195707321167, 12.504474639892578]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 12.0, 11.0, 22.0, 25.0, 40.0, 46.0, 78.0, 114.0, 191.0, 286.0, 439.0, 730.0, 1297.0, 2610.0, 5722.0, 13106.0, 33701.0, 99867.0, 380969.0, 1872947.0, 1385367.0, 271834.0, 76409.0, 27116.0, 10842.0, 4891.0, 2376.0, 1323.0, 679.0, 438.0, 247.0, 170.0, 100.0, 82.0, 45.0, 51.0, 20.0, 22.0, 13.0, 12.0, 4.0, 2.0, 2.0, 6.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-3.255859375, -3.16253662109375, -3.0692138671875, -2.97589111328125, -2.882568359375, -2.78924560546875, -2.6959228515625, -2.60260009765625, -2.50927734375, -2.41595458984375, -2.3226318359375, -2.22930908203125, -2.135986328125, -2.04266357421875, -1.9493408203125, -1.85601806640625, -1.7626953125, -1.66937255859375, -1.5760498046875, -1.48272705078125, -1.389404296875, -1.29608154296875, -1.2027587890625, -1.10943603515625, -1.01611328125, -0.92279052734375, -0.8294677734375, -0.73614501953125, -0.642822265625, -0.54949951171875, -0.4561767578125, -0.36285400390625, -0.26953125, -0.17620849609375, -0.0828857421875, 0.01043701171875, 0.103759765625, 0.19708251953125, 0.2904052734375, 0.38372802734375, 0.47705078125, 0.57037353515625, 0.6636962890625, 0.75701904296875, 0.850341796875, 0.94366455078125, 1.0369873046875, 1.13031005859375, 1.2236328125, 1.31695556640625, 1.4102783203125, 1.50360107421875, 1.596923828125, 1.69024658203125, 1.7835693359375, 1.87689208984375, 1.97021484375, 2.06353759765625, 2.1568603515625, 2.25018310546875, 2.343505859375, 2.43682861328125, 2.5301513671875, 2.62347412109375, 2.716796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 19.0, 16.0, 16.0, 16.0, 23.0, 24.0, 26.0, 28.0, 33.0, 43.0, 42.0, 46.0, 36.0, 38.0, 47.0, 53.0, 39.0, 43.0, 33.0, 41.0, 38.0, 32.0, 22.0, 26.0, 37.0, 18.0, 14.0, 22.0, 13.0, 11.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.580078125, -1.528533935546875, -1.47698974609375, -1.425445556640625, -1.3739013671875, -1.322357177734375, -1.27081298828125, -1.219268798828125, -1.167724609375, -1.116180419921875, -1.06463623046875, -1.013092041015625, -0.9615478515625, -0.910003662109375, -0.85845947265625, -0.806915283203125, -0.75537109375, -0.703826904296875, -0.65228271484375, -0.600738525390625, -0.5491943359375, -0.497650146484375, -0.44610595703125, -0.394561767578125, -0.343017578125, -0.291473388671875, -0.23992919921875, -0.188385009765625, -0.1368408203125, -0.085296630859375, -0.03375244140625, 0.017791748046875, 0.0693359375, 0.120880126953125, 0.17242431640625, 0.223968505859375, 0.2755126953125, 0.327056884765625, 0.37860107421875, 0.430145263671875, 0.481689453125, 0.533233642578125, 0.58477783203125, 0.636322021484375, 0.6878662109375, 0.739410400390625, 0.79095458984375, 0.842498779296875, 0.89404296875, 0.945587158203125, 0.99713134765625, 1.048675537109375, 1.1002197265625, 1.151763916015625, 1.20330810546875, 1.254852294921875, 1.306396484375, 1.357940673828125, 1.40948486328125, 1.461029052734375, 1.5125732421875, 1.564117431640625, 1.61566162109375, 1.667205810546875, 1.71875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 10.0, 12.0, 24.0, 33.0, 78.0, 100.0, 195.0, 399.0, 723.0, 1509.0, 3571.0, 10438.0, 39883.0, 200652.0, 2159780.0, 1566449.0, 161618.0, 33831.0, 9156.0, 3051.0, 1317.0, 605.0, 367.0, 179.0, 113.0, 66.0, 28.0, 27.0, 18.0, 14.0, 2.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.12188720703125, -4.9508056640625, -4.77972412109375, -4.608642578125, -4.43756103515625, -4.2664794921875, -4.09539794921875, -3.92431640625, -3.75323486328125, -3.5821533203125, -3.41107177734375, -3.239990234375, -3.06890869140625, -2.8978271484375, -2.72674560546875, -2.5556640625, -2.38458251953125, -2.2135009765625, -2.04241943359375, -1.871337890625, -1.70025634765625, -1.5291748046875, -1.35809326171875, -1.18701171875, -1.01593017578125, -0.8448486328125, -0.67376708984375, -0.502685546875, -0.33160400390625, -0.1605224609375, 0.01055908203125, 0.181640625, 0.35272216796875, 0.5238037109375, 0.69488525390625, 0.865966796875, 1.03704833984375, 1.2081298828125, 1.37921142578125, 1.55029296875, 1.72137451171875, 1.8924560546875, 2.06353759765625, 2.234619140625, 2.40570068359375, 2.5767822265625, 2.74786376953125, 2.9189453125, 3.09002685546875, 3.2611083984375, 3.43218994140625, 3.603271484375, 3.77435302734375, 3.9454345703125, 4.11651611328125, 4.28759765625, 4.45867919921875, 4.6297607421875, 4.80084228515625, 4.971923828125, 5.14300537109375, 5.3140869140625, 5.48516845703125, 5.65625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 8.0, 4.0, 3.0, 21.0, 19.0, 26.0, 43.0, 60.0, 79.0, 124.0, 177.0, 312.0, 559.0, 818.0, 679.0, 396.0, 236.0, 159.0, 85.0, 72.0, 53.0, 30.0, 29.0, 18.0, 19.0, 16.0, 2.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.4881591796875, -4.331787109375, -4.1754150390625, -4.01904296875, -3.8626708984375, -3.706298828125, -3.5499267578125, -3.3935546875, -3.2371826171875, -3.080810546875, -2.9244384765625, -2.76806640625, -2.6116943359375, -2.455322265625, -2.2989501953125, -2.142578125, -1.9862060546875, -1.829833984375, -1.6734619140625, -1.51708984375, -1.3607177734375, -1.204345703125, -1.0479736328125, -0.8916015625, -0.7352294921875, -0.578857421875, -0.4224853515625, -0.26611328125, -0.1097412109375, 0.046630859375, 0.2030029296875, 0.359375, 0.5157470703125, 0.672119140625, 0.8284912109375, 0.98486328125, 1.1412353515625, 1.297607421875, 1.4539794921875, 1.6103515625, 1.7667236328125, 1.923095703125, 2.0794677734375, 2.23583984375, 2.3922119140625, 2.548583984375, 2.7049560546875, 2.861328125, 3.0177001953125, 3.174072265625, 3.3304443359375, 3.48681640625, 3.6431884765625, 3.799560546875, 3.9559326171875, 4.1123046875, 4.2686767578125, 4.425048828125, 4.5814208984375, 4.73779296875, 4.8941650390625, 5.050537109375, 5.2069091796875, 5.36328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 12.0, 33.0, 72.0, 115.0, 173.0, 167.0, 165.0, 103.0, 82.0, 32.0, 13.0, 13.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.73253631591797, -32.65579605102539, -31.579057693481445, -30.5023193359375, -29.425579071044922, -28.348840713500977, -27.27210235595703, -26.195362091064453, -25.118621826171875, -24.04188346862793, -22.96514320373535, -21.888404846191406, -20.811664581298828, -19.734926223754883, -18.658187866210938, -17.58144760131836, -16.504709243774414, -15.427969932556152, -14.35123062133789, -13.274492263793945, -12.197751998901367, -11.121013641357422, -10.04427433013916, -8.967535018920898, -7.890795707702637, -6.814056396484375, -5.737317085266113, -4.66057825088501, -3.583838939666748, -2.5070996284484863, -1.4303607940673828, -0.3536214828491211, 0.7231178283691406, 1.7998570203781128, 2.876596212387085, 3.9533352851867676, 5.030074596405029, 6.106813907623291, 7.1835527420043945, 8.260292053222656, 9.337031364440918, 10.41377067565918, 11.490509986877441, 12.567249298095703, 13.643987655639648, 14.720727920532227, 15.797466278076172, 16.87420654296875, 17.950944900512695, 19.02768325805664, 20.10442352294922, 21.181161880493164, 22.257902145385742, 23.334640502929688, 24.411380767822266, 25.48811912536621, 26.564857482910156, 27.6415958404541, 28.71833610534668, 29.795074462890625, 30.871814727783203, 31.94855308532715, 33.025291442871094, 34.10203170776367, 35.17877197265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 14.0, 10.0, 14.0, 16.0, 11.0, 14.0, 23.0, 27.0, 20.0, 35.0, 24.0, 22.0, 41.0, 31.0, 37.0, 32.0, 32.0, 40.0, 50.0, 42.0, 45.0, 32.0, 41.0, 26.0, 45.0, 34.0, 34.0, 26.0, 29.0, 23.0, 17.0, 15.0, 13.0, 10.0, 12.0, 7.0, 7.0, 9.0, 2.0, 1.0, 5.0, 7.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.403112411499023, -12.035148620605469, -11.667183876037598, -11.299219131469727, -10.931255340576172, -10.563291549682617, -10.195326805114746, -9.827362060546875, -9.45939826965332, -9.091434478759766, -8.723469734191895, -8.355504989624023, -7.987541198730469, -7.619576930999756, -7.251612663269043, -6.88364839553833, -6.515684127807617, -6.147719860076904, -5.779755592346191, -5.4117913246154785, -5.043827056884766, -4.675862789154053, -4.30789852142334, -3.939934253692627, -3.571969985961914, -3.204005718231201, -2.8360414505004883, -2.4680771827697754, -2.1001129150390625, -1.7321486473083496, -1.3641843795776367, -0.9962201118469238, -0.6282558441162109, -0.26029157638549805, 0.10767269134521484, 0.47563695907592773, 0.8436012268066406, 1.2115654945373535, 1.5795297622680664, 1.9474940299987793, 2.315458297729492, 2.683422565460205, 3.051386833190918, 3.419351100921631, 3.7873153686523438, 4.155279636383057, 4.5232439041137695, 4.891208171844482, 5.259172439575195, 5.627136707305908, 5.995100975036621, 6.363065242767334, 6.731029510498047, 7.09899377822876, 7.466958045959473, 7.8349223136901855, 8.202886581420898, 8.570850372314453, 8.938815116882324, 9.306779861450195, 9.67474365234375, 10.042707443237305, 10.410672187805176, 10.778636932373047, 11.146600723266602]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 9.0, 28.0, 40.0, 38.0, 87.0, 129.0, 148.0, 237.0, 356.0, 526.0, 762.0, 1195.0, 1731.0, 2614.0, 3952.0, 6206.0, 9329.0, 14719.0, 25348.0, 53694.0, 155237.0, 355555.0, 247430.0, 83311.0, 34142.0, 18631.0, 11504.0, 7411.0, 4698.0, 3176.0, 2104.0, 1439.0, 929.0, 606.0, 377.0, 261.0, 194.0, 117.0, 81.0, 62.0, 37.0, 31.0, 10.0, 16.0, 9.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.533203125, -2.45074462890625, -2.3682861328125, -2.28582763671875, -2.203369140625, -2.12091064453125, -2.0384521484375, -1.95599365234375, -1.87353515625, -1.79107666015625, -1.7086181640625, -1.62615966796875, -1.543701171875, -1.46124267578125, -1.3787841796875, -1.29632568359375, -1.2138671875, -1.13140869140625, -1.0489501953125, -0.96649169921875, -0.884033203125, -0.80157470703125, -0.7191162109375, -0.63665771484375, -0.55419921875, -0.47174072265625, -0.3892822265625, -0.30682373046875, -0.224365234375, -0.14190673828125, -0.0594482421875, 0.02301025390625, 0.10546875, 0.18792724609375, 0.2703857421875, 0.35284423828125, 0.435302734375, 0.51776123046875, 0.6002197265625, 0.68267822265625, 0.76513671875, 0.84759521484375, 0.9300537109375, 1.01251220703125, 1.094970703125, 1.17742919921875, 1.2598876953125, 1.34234619140625, 1.4248046875, 1.50726318359375, 1.5897216796875, 1.67218017578125, 1.754638671875, 1.83709716796875, 1.9195556640625, 2.00201416015625, 2.08447265625, 2.16693115234375, 2.2493896484375, 2.33184814453125, 2.414306640625, 2.49676513671875, 2.5792236328125, 2.66168212890625, 2.744140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 8.0, 7.0, 12.0, 12.0, 15.0, 13.0, 28.0, 17.0, 35.0, 30.0, 41.0, 40.0, 47.0, 40.0, 53.0, 51.0, 59.0, 52.0, 39.0, 48.0, 36.0, 51.0, 42.0, 33.0, 38.0, 24.0, 23.0, 19.0, 15.0, 14.0, 6.0, 12.0, 6.0, 6.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8896484375, -1.8302001953125, -1.770751953125, -1.7113037109375, -1.65185546875, -1.5924072265625, -1.532958984375, -1.4735107421875, -1.4140625, -1.3546142578125, -1.295166015625, -1.2357177734375, -1.17626953125, -1.1168212890625, -1.057373046875, -0.9979248046875, -0.9384765625, -0.8790283203125, -0.819580078125, -0.7601318359375, -0.70068359375, -0.6412353515625, -0.581787109375, -0.5223388671875, -0.462890625, -0.4034423828125, -0.343994140625, -0.2845458984375, -0.22509765625, -0.1656494140625, -0.106201171875, -0.0467529296875, 0.0126953125, 0.0721435546875, 0.131591796875, 0.1910400390625, 0.25048828125, 0.3099365234375, 0.369384765625, 0.4288330078125, 0.48828125, 0.5477294921875, 0.607177734375, 0.6666259765625, 0.72607421875, 0.7855224609375, 0.844970703125, 0.9044189453125, 0.9638671875, 1.0233154296875, 1.082763671875, 1.1422119140625, 1.20166015625, 1.2611083984375, 1.320556640625, 1.3800048828125, 1.439453125, 1.4989013671875, 1.558349609375, 1.6177978515625, 1.67724609375, 1.7366943359375, 1.796142578125, 1.8555908203125, 1.9150390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 3.0, 8.0, 11.0, 31.0, 30.0, 61.0, 79.0, 116.0, 159.0, 328.0, 598.0, 1218.0, 2530.0, 5846.0, 15134.0, 44435.0, 223876.0, 578253.0, 125233.0, 30799.0, 11044.0, 4578.0, 1995.0, 972.0, 510.0, 269.0, 149.0, 93.0, 56.0, 36.0, 26.0, 19.0, 10.0, 12.0, 9.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.12554931640625, -4.9620361328125, -4.79852294921875, -4.635009765625, -4.47149658203125, -4.3079833984375, -4.14447021484375, -3.98095703125, -3.81744384765625, -3.6539306640625, -3.49041748046875, -3.326904296875, -3.16339111328125, -2.9998779296875, -2.83636474609375, -2.6728515625, -2.50933837890625, -2.3458251953125, -2.18231201171875, -2.018798828125, -1.85528564453125, -1.6917724609375, -1.52825927734375, -1.36474609375, -1.20123291015625, -1.0377197265625, -0.87420654296875, -0.710693359375, -0.54718017578125, -0.3836669921875, -0.22015380859375, -0.056640625, 0.10687255859375, 0.2703857421875, 0.43389892578125, 0.597412109375, 0.76092529296875, 0.9244384765625, 1.08795166015625, 1.25146484375, 1.41497802734375, 1.5784912109375, 1.74200439453125, 1.905517578125, 2.06903076171875, 2.2325439453125, 2.39605712890625, 2.5595703125, 2.72308349609375, 2.8865966796875, 3.05010986328125, 3.213623046875, 3.37713623046875, 3.5406494140625, 3.70416259765625, 3.86767578125, 4.03118896484375, 4.1947021484375, 4.35821533203125, 4.521728515625, 4.68524169921875, 4.8487548828125, 5.01226806640625, 5.17578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 8.0, 7.0, 8.0, 9.0, 16.0, 20.0, 16.0, 25.0, 28.0, 30.0, 28.0, 35.0, 36.0, 40.0, 61.0, 33.0, 42.0, 53.0, 42.0, 54.0, 47.0, 31.0, 26.0, 40.0, 35.0, 34.0, 21.0, 25.0, 21.0, 25.0, 16.0, 14.0, 15.0, 16.0, 5.0, 5.0, 9.0, 2.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.3167724609375, -6.121826171875, -5.9268798828125, -5.73193359375, -5.5369873046875, -5.342041015625, -5.1470947265625, -4.9521484375, -4.7572021484375, -4.562255859375, -4.3673095703125, -4.17236328125, -3.9774169921875, -3.782470703125, -3.5875244140625, -3.392578125, -3.1976318359375, -3.002685546875, -2.8077392578125, -2.61279296875, -2.4178466796875, -2.222900390625, -2.0279541015625, -1.8330078125, -1.6380615234375, -1.443115234375, -1.2481689453125, -1.05322265625, -0.8582763671875, -0.663330078125, -0.4683837890625, -0.2734375, -0.0784912109375, 0.116455078125, 0.3114013671875, 0.50634765625, 0.7012939453125, 0.896240234375, 1.0911865234375, 1.2861328125, 1.4810791015625, 1.676025390625, 1.8709716796875, 2.06591796875, 2.2608642578125, 2.455810546875, 2.6507568359375, 2.845703125, 3.0406494140625, 3.235595703125, 3.4305419921875, 3.62548828125, 3.8204345703125, 4.015380859375, 4.2103271484375, 4.4052734375, 4.6002197265625, 4.795166015625, 4.9901123046875, 5.18505859375, 5.3800048828125, 5.574951171875, 5.7698974609375, 5.96484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 3.0, 12.0, 18.0, 29.0, 40.0, 50.0, 68.0, 93.0, 154.0, 249.0, 331.0, 594.0, 994.0, 1680.0, 2938.0, 5127.0, 9730.0, 19399.0, 43383.0, 114623.0, 323268.0, 324858.0, 115857.0, 43518.0, 19307.0, 9658.0, 5197.0, 2959.0, 1641.0, 1061.0, 595.0, 395.0, 240.0, 134.0, 102.0, 69.0, 42.0, 32.0, 31.0, 22.0, 12.0, 12.0, 8.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0], "bins": [-1.3828125, -1.3433074951171875, -1.303802490234375, -1.2642974853515625, -1.22479248046875, -1.1852874755859375, -1.145782470703125, -1.1062774658203125, -1.0667724609375, -1.0272674560546875, -0.987762451171875, -0.9482574462890625, -0.90875244140625, -0.8692474365234375, -0.829742431640625, -0.7902374267578125, -0.750732421875, -0.7112274169921875, -0.671722412109375, -0.6322174072265625, -0.59271240234375, -0.5532073974609375, -0.513702392578125, -0.4741973876953125, -0.4346923828125, -0.3951873779296875, -0.355682373046875, -0.3161773681640625, -0.27667236328125, -0.2371673583984375, -0.197662353515625, -0.1581573486328125, -0.11865234375, -0.0791473388671875, -0.039642333984375, -0.0001373291015625, 0.03936767578125, 0.0788726806640625, 0.118377685546875, 0.1578826904296875, 0.1973876953125, 0.2368927001953125, 0.276397705078125, 0.3159027099609375, 0.35540771484375, 0.3949127197265625, 0.434417724609375, 0.4739227294921875, 0.513427734375, 0.5529327392578125, 0.592437744140625, 0.6319427490234375, 0.67144775390625, 0.7109527587890625, 0.750457763671875, 0.7899627685546875, 0.8294677734375, 0.8689727783203125, 0.908477783203125, 0.9479827880859375, 0.98748779296875, 1.0269927978515625, 1.066497802734375, 1.1060028076171875, 1.1455078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 18.0, 19.0, 26.0, 28.0, 52.0, 82.0, 150.0, 139.0, 146.0, 92.0, 57.0, 32.0, 26.0, 23.0, 17.0, 13.0, 10.0, 11.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004892349243164062, -0.0004732981324195862, -0.0004573613405227661, -0.00044142454862594604, -0.000425487756729126, -0.0004095509648323059, -0.00039361417293548584, -0.00037767738103866577, -0.0003617405891418457, -0.00034580379724502563, -0.00032986700534820557, -0.0003139302134513855, -0.00029799342155456543, -0.00028205662965774536, -0.0002661198377609253, -0.0002501830458641052, -0.00023424625396728516, -0.0002183094620704651, -0.00020237267017364502, -0.00018643587827682495, -0.00017049908638000488, -0.00015456229448318481, -0.00013862550258636475, -0.00012268871068954468, -0.00010675191879272461, -9.081512689590454e-05, -7.487833499908447e-05, -5.8941543102264404e-05, -4.3004751205444336e-05, -2.7067959308624268e-05, -1.11311674118042e-05, 4.805624485015869e-06, 2.0742416381835938e-05, 3.6679208278656006e-05, 5.2616000175476074e-05, 6.855279207229614e-05, 8.448958396911621e-05, 0.00010042637586593628, 0.00011636316776275635, 0.00013229995965957642, 0.00014823675155639648, 0.00016417354345321655, 0.00018011033535003662, 0.0001960471272468567, 0.00021198391914367676, 0.00022792071104049683, 0.0002438575029373169, 0.00025979429483413696, 0.00027573108673095703, 0.0002916678786277771, 0.00030760467052459717, 0.00032354146242141724, 0.0003394782543182373, 0.0003554150462150574, 0.00037135183811187744, 0.0003872886300086975, 0.0004032254219055176, 0.00041916221380233765, 0.0004350990056991577, 0.0004510357975959778, 0.00046697258949279785, 0.0004829093813896179, 0.000498846173286438, 0.0005147829651832581, 0.0005307197570800781]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 8.0, 12.0, 7.0, 2.0, 5.0, 9.0, 19.0, 19.0, 27.0, 35.0, 60.0, 85.0, 96.0, 151.0, 236.0, 382.0, 642.0, 1156.0, 2094.0, 4032.0, 8183.0, 17422.0, 40398.0, 102718.0, 272051.0, 344538.0, 151655.0, 56521.0, 23721.0, 10750.0, 5341.0, 2652.0, 1359.0, 775.0, 446.0, 293.0, 203.0, 128.0, 70.0, 79.0, 45.0, 38.0, 26.0, 16.0, 16.0, 12.0, 8.0, 8.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0595703125, -1.0232696533203125, -0.986968994140625, -0.9506683349609375, -0.91436767578125, -0.8780670166015625, -0.841766357421875, -0.8054656982421875, -0.7691650390625, -0.7328643798828125, -0.696563720703125, -0.6602630615234375, -0.62396240234375, -0.5876617431640625, -0.551361083984375, -0.5150604248046875, -0.478759765625, -0.4424591064453125, -0.406158447265625, -0.3698577880859375, -0.33355712890625, -0.2972564697265625, -0.260955810546875, -0.2246551513671875, -0.1883544921875, -0.1520538330078125, -0.115753173828125, -0.0794525146484375, -0.04315185546875, -0.0068511962890625, 0.029449462890625, 0.0657501220703125, 0.10205078125, 0.1383514404296875, 0.174652099609375, 0.2109527587890625, 0.24725341796875, 0.2835540771484375, 0.319854736328125, 0.3561553955078125, 0.3924560546875, 0.4287567138671875, 0.465057373046875, 0.5013580322265625, 0.53765869140625, 0.5739593505859375, 0.610260009765625, 0.6465606689453125, 0.682861328125, 0.7191619873046875, 0.755462646484375, 0.7917633056640625, 0.82806396484375, 0.8643646240234375, 0.900665283203125, 0.9369659423828125, 0.9732666015625, 1.0095672607421875, 1.045867919921875, 1.0821685791015625, 1.11846923828125, 1.1547698974609375, 1.191070556640625, 1.2273712158203125, 1.263671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 6.0, 4.0, 4.0, 5.0, 12.0, 17.0, 16.0, 23.0, 35.0, 23.0, 39.0, 64.0, 50.0, 75.0, 90.0, 80.0, 75.0, 80.0, 63.0, 57.0, 43.0, 26.0, 33.0, 22.0, 15.0, 8.0, 10.0, 6.0, 1.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8154296875, -1.7667388916015625, -1.718048095703125, -1.6693572998046875, -1.62066650390625, -1.5719757080078125, -1.523284912109375, -1.4745941162109375, -1.4259033203125, -1.3772125244140625, -1.328521728515625, -1.2798309326171875, -1.23114013671875, -1.1824493408203125, -1.133758544921875, -1.0850677490234375, -1.036376953125, -0.9876861572265625, -0.938995361328125, -0.8903045654296875, -0.84161376953125, -0.7929229736328125, -0.744232177734375, -0.6955413818359375, -0.6468505859375, -0.5981597900390625, -0.549468994140625, -0.5007781982421875, -0.45208740234375, -0.4033966064453125, -0.354705810546875, -0.3060150146484375, -0.25732421875, -0.2086334228515625, -0.159942626953125, -0.1112518310546875, -0.06256103515625, -0.0138702392578125, 0.034820556640625, 0.0835113525390625, 0.1322021484375, 0.1808929443359375, 0.229583740234375, 0.2782745361328125, 0.32696533203125, 0.3756561279296875, 0.424346923828125, 0.4730377197265625, 0.521728515625, 0.5704193115234375, 0.619110107421875, 0.6678009033203125, 0.71649169921875, 0.7651824951171875, 0.813873291015625, 0.8625640869140625, 0.9112548828125, 0.9599456787109375, 1.008636474609375, 1.0573272705078125, 1.10601806640625, 1.1547088623046875, 1.203399658203125, 1.2520904541015625, 1.30078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 12.0, 23.0, 52.0, 117.0, 211.0, 226.0, 167.0, 110.0, 53.0, 14.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.001815795898438, -21.930543899536133, -20.859270095825195, -19.78799819946289, -18.716724395751953, -17.64545249938965, -16.574180603027344, -15.502907752990723, -14.431634902954102, -13.36036205291748, -12.28908920288086, -11.217817306518555, -10.146544456481934, -9.075271606445312, -8.003999710083008, -6.932726860046387, -5.861454010009766, -4.7901811599731445, -3.7189087867736816, -2.6476361751556396, -1.5763635635375977, -0.5050907135009766, 0.5661816596984863, 1.6374540328979492, 2.7087268829345703, 3.7799994945526123, 4.851272106170654, 5.922544479370117, 6.993817329406738, 8.06509017944336, 9.136362075805664, 10.207634925842285, 11.278911590576172, 12.350184440612793, 13.421457290649414, 14.492729187011719, 15.56400203704834, 16.63527488708496, 17.706546783447266, 18.777820587158203, 19.849092483520508, 20.920364379882812, 21.99163818359375, 23.062910079956055, 24.13418197631836, 25.205455780029297, 26.2767276763916, 27.347999572753906, 28.419273376464844, 29.49054527282715, 30.561819076538086, 31.63309097290039, 32.70436477661133, 33.775634765625, 34.84690856933594, 35.918182373046875, 36.98945617675781, 38.06072998046875, 39.13199996948242, 40.20327377319336, 41.2745475769043, 42.34581756591797, 43.417091369628906, 44.488365173339844, 45.559635162353516]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 6.0, 9.0, 16.0, 14.0, 16.0, 11.0, 23.0, 29.0, 27.0, 35.0, 29.0, 44.0, 38.0, 29.0, 43.0, 37.0, 45.0, 40.0, 38.0, 33.0, 41.0, 41.0, 39.0, 43.0, 33.0, 37.0, 31.0, 28.0, 13.0, 21.0, 14.0, 15.0, 15.0, 10.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.081348419189453, -12.653268814086914, -12.225190162658691, -11.797110557556152, -11.36903190612793, -10.94095230102539, -10.512872695922852, -10.084793090820312, -9.65671443939209, -9.22863483428955, -8.800556182861328, -8.372476577758789, -7.944397449493408, -7.516318321228027, -7.088238716125488, -6.660159587860107, -6.232080459594727, -5.804001331329346, -5.375922203063965, -4.947842597961426, -4.519763469696045, -4.091684341430664, -3.663604974746704, -3.235525608062744, -2.8074464797973633, -2.3793673515319824, -1.9512879848480225, -1.523208737373352, -1.0951294898986816, -0.6670503616333008, -0.23897099494934082, 0.18910837173461914, 0.6171884536743164, 1.0452677011489868, 1.4733469486236572, 1.9014261960983276, 2.329505443572998, 2.757584571838379, 3.185663938522339, 3.613743305206299, 4.04182243347168, 4.4699015617370605, 4.897980690002441, 5.3260602951049805, 5.754139423370361, 6.182218551635742, 6.610298156738281, 7.038377285003662, 7.466456413269043, 7.894535541534424, 8.322614669799805, 8.750694274902344, 9.178773880004883, 9.606852531433105, 10.034932136535645, 10.463010787963867, 10.891090393066406, 11.319169998168945, 11.747248649597168, 12.175328254699707, 12.60340690612793, 13.031486511230469, 13.459566116333008, 13.887645721435547, 14.31572437286377]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 10.0, 17.0, 23.0, 38.0, 54.0, 75.0, 112.0, 154.0, 265.0, 405.0, 716.0, 1017.0, 1690.0, 2847.0, 4659.0, 8115.0, 13802.0, 24665.0, 45994.0, 89806.0, 188393.0, 433913.0, 961041.0, 1208154.0, 660448.0, 279040.0, 125636.0, 62998.0, 33512.0, 18735.0, 10764.0, 6504.0, 3866.0, 2464.0, 1519.0, 970.0, 638.0, 401.0, 261.0, 195.0, 117.0, 78.0, 52.0, 30.0, 35.0, 13.0, 16.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.60546875, -1.5540924072265625, -1.502716064453125, -1.4513397216796875, -1.39996337890625, -1.3485870361328125, -1.297210693359375, -1.2458343505859375, -1.1944580078125, -1.1430816650390625, -1.091705322265625, -1.0403289794921875, -0.98895263671875, -0.9375762939453125, -0.886199951171875, -0.8348236083984375, -0.783447265625, -0.7320709228515625, -0.680694580078125, -0.6293182373046875, -0.57794189453125, -0.5265655517578125, -0.475189208984375, -0.4238128662109375, -0.3724365234375, -0.3210601806640625, -0.269683837890625, -0.2183074951171875, -0.16693115234375, -0.1155548095703125, -0.064178466796875, -0.0128021240234375, 0.03857421875, 0.0899505615234375, 0.141326904296875, 0.1927032470703125, 0.24407958984375, 0.2954559326171875, 0.346832275390625, 0.3982086181640625, 0.4495849609375, 0.5009613037109375, 0.552337646484375, 0.6037139892578125, 0.65509033203125, 0.7064666748046875, 0.757843017578125, 0.8092193603515625, 0.860595703125, 0.9119720458984375, 0.963348388671875, 1.0147247314453125, 1.06610107421875, 1.1174774169921875, 1.168853759765625, 1.2202301025390625, 1.2716064453125, 1.3229827880859375, 1.374359130859375, 1.4257354736328125, 1.47711181640625, 1.5284881591796875, 1.579864501953125, 1.6312408447265625, 1.6826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 3.0, 6.0, 7.0, 13.0, 3.0, 10.0, 6.0, 11.0, 15.0, 21.0, 24.0, 21.0, 24.0, 35.0, 29.0, 35.0, 36.0, 39.0, 33.0, 37.0, 51.0, 37.0, 43.0, 43.0, 44.0, 37.0, 35.0, 38.0, 40.0, 33.0, 16.0, 23.0, 26.0, 14.0, 18.0, 22.0, 11.0, 15.0, 4.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4990234375, -1.44525146484375, -1.3914794921875, -1.33770751953125, -1.283935546875, -1.23016357421875, -1.1763916015625, -1.12261962890625, -1.06884765625, -1.01507568359375, -0.9613037109375, -0.90753173828125, -0.853759765625, -0.79998779296875, -0.7462158203125, -0.69244384765625, -0.638671875, -0.58489990234375, -0.5311279296875, -0.47735595703125, -0.423583984375, -0.36981201171875, -0.3160400390625, -0.26226806640625, -0.20849609375, -0.15472412109375, -0.1009521484375, -0.04718017578125, 0.006591796875, 0.06036376953125, 0.1141357421875, 0.16790771484375, 0.2216796875, 0.27545166015625, 0.3292236328125, 0.38299560546875, 0.436767578125, 0.49053955078125, 0.5443115234375, 0.59808349609375, 0.65185546875, 0.70562744140625, 0.7593994140625, 0.81317138671875, 0.866943359375, 0.92071533203125, 0.9744873046875, 1.02825927734375, 1.08203125, 1.13580322265625, 1.1895751953125, 1.24334716796875, 1.297119140625, 1.35089111328125, 1.4046630859375, 1.45843505859375, 1.51220703125, 1.56597900390625, 1.6197509765625, 1.67352294921875, 1.727294921875, 1.78106689453125, 1.8348388671875, 1.88861083984375, 1.9423828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 11.0, 35.0, 48.0, 61.0, 122.0, 210.0, 402.0, 852.0, 2305.0, 8103.0, 40292.0, 282305.0, 2805968.0, 928109.0, 102062.0, 16918.0, 3991.0, 1237.0, 556.0, 294.0, 159.0, 96.0, 48.0, 27.0, 21.0, 11.0, 12.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.859375, -5.66241455078125, -5.4654541015625, -5.26849365234375, -5.071533203125, -4.87457275390625, -4.6776123046875, -4.48065185546875, -4.28369140625, -4.08673095703125, -3.8897705078125, -3.69281005859375, -3.495849609375, -3.29888916015625, -3.1019287109375, -2.90496826171875, -2.7080078125, -2.51104736328125, -2.3140869140625, -2.11712646484375, -1.920166015625, -1.72320556640625, -1.5262451171875, -1.32928466796875, -1.13232421875, -0.93536376953125, -0.7384033203125, -0.54144287109375, -0.344482421875, -0.14752197265625, 0.0494384765625, 0.24639892578125, 0.443359375, 0.64031982421875, 0.8372802734375, 1.03424072265625, 1.231201171875, 1.42816162109375, 1.6251220703125, 1.82208251953125, 2.01904296875, 2.21600341796875, 2.4129638671875, 2.60992431640625, 2.806884765625, 3.00384521484375, 3.2008056640625, 3.39776611328125, 3.5947265625, 3.79168701171875, 3.9886474609375, 4.18560791015625, 4.382568359375, 4.57952880859375, 4.7764892578125, 4.97344970703125, 5.17041015625, 5.36737060546875, 5.5643310546875, 5.76129150390625, 5.958251953125, 6.15521240234375, 6.3521728515625, 6.54913330078125, 6.74609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 16.0, 26.0, 20.0, 38.0, 68.0, 117.0, 148.0, 268.0, 463.0, 789.0, 858.0, 490.0, 286.0, 172.0, 115.0, 76.0, 44.0, 24.0, 16.0, 12.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.1038818359375, -6.895263671875, -6.6866455078125, -6.47802734375, -6.2694091796875, -6.060791015625, -5.8521728515625, -5.6435546875, -5.4349365234375, -5.226318359375, -5.0177001953125, -4.80908203125, -4.6004638671875, -4.391845703125, -4.1832275390625, -3.974609375, -3.7659912109375, -3.557373046875, -3.3487548828125, -3.14013671875, -2.9315185546875, -2.722900390625, -2.5142822265625, -2.3056640625, -2.0970458984375, -1.888427734375, -1.6798095703125, -1.47119140625, -1.2625732421875, -1.053955078125, -0.8453369140625, -0.63671875, -0.4281005859375, -0.219482421875, -0.0108642578125, 0.19775390625, 0.4063720703125, 0.614990234375, 0.8236083984375, 1.0322265625, 1.2408447265625, 1.449462890625, 1.6580810546875, 1.86669921875, 2.0753173828125, 2.283935546875, 2.4925537109375, 2.701171875, 2.9097900390625, 3.118408203125, 3.3270263671875, 3.53564453125, 3.7442626953125, 3.952880859375, 4.1614990234375, 4.3701171875, 4.5787353515625, 4.787353515625, 4.9959716796875, 5.20458984375, 5.4132080078125, 5.621826171875, 5.8304443359375, 6.0390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 12.0, 22.0, 64.0, 146.0, 255.0, 253.0, 159.0, 59.0, 21.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.74494934082031, -74.0639419555664, -72.3829345703125, -70.7019271850586, -69.02091979980469, -67.33991241455078, -65.65890502929688, -63.97789764404297, -62.29689025878906, -60.615882873535156, -58.93487548828125, -57.253868103027344, -55.57286071777344, -53.89185333251953, -52.210845947265625, -50.52983856201172, -48.84882736206055, -47.16781997680664, -45.486812591552734, -43.80580520629883, -42.12479782104492, -40.443790435791016, -38.762779235839844, -37.08177185058594, -35.40076446533203, -33.719757080078125, -32.03874969482422, -30.357742309570312, -28.676734924316406, -26.9957275390625, -25.31471824645996, -23.633710861206055, -21.95270347595215, -20.271696090698242, -18.590688705444336, -16.909679412841797, -15.228672981262207, -13.5476655960083, -11.866657257080078, -10.185649871826172, -8.504642486572266, -6.823635101318359, -5.142627239227295, -3.4616193771362305, -1.7806119918823242, -0.09960460662841797, 1.5814037322998047, 3.262411117553711, 4.943418502807617, 6.624425888061523, 8.30543327331543, 9.986441612243652, 11.667448997497559, 13.348456382751465, 15.029464721679688, 16.710472106933594, 18.3914794921875, 20.072486877441406, 21.753494262695312, 23.43450164794922, 25.115509033203125, 26.79651641845703, 28.47752571105957, 30.158533096313477, 31.839540481567383]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 6.0, 5.0, 11.0, 17.0, 13.0, 19.0, 25.0, 29.0, 40.0, 29.0, 36.0, 36.0, 37.0, 48.0, 56.0, 44.0, 50.0, 52.0, 63.0, 55.0, 44.0, 41.0, 26.0, 48.0, 26.0, 28.0, 17.0, 9.0, 16.0, 14.0, 9.0, 8.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.41199493408203, -15.853789329528809, -15.295584678649902, -14.73737907409668, -14.179174423217773, -13.62096881866455, -13.062763214111328, -12.504558563232422, -11.9463529586792, -11.388147354125977, -10.82994270324707, -10.271737098693848, -9.713531494140625, -9.155326843261719, -8.597121238708496, -8.038915634155273, -7.480710983276367, -6.922505855560303, -6.364300727844238, -5.806095123291016, -5.247889995574951, -4.689684867858887, -4.131479263305664, -3.5732741355895996, -3.015069007873535, -2.4568638801574707, -1.8986585140228271, -1.3404532670974731, -0.7822480201721191, -0.2240428924560547, 0.33416247367858887, 0.8923678398132324, 1.4505748748779297, 2.008780002593994, 2.5669853687286377, 3.1251907348632812, 3.6833958625793457, 4.24160099029541, 4.799806594848633, 5.358011722564697, 5.916216850280762, 6.474421977996826, 7.032627105712891, 7.590832710266113, 8.149038314819336, 8.707242965698242, 9.265448570251465, 9.823654174804688, 10.381858825683594, 10.940064430236816, 11.498269081115723, 12.056474685668945, 12.614679336547852, 13.172884941101074, 13.731090545654297, 14.289295196533203, 14.847500801086426, 15.405706405639648, 15.963911056518555, 16.52211570739746, 17.080322265625, 17.638526916503906, 18.196731567382812, 18.75493812561035, 19.313142776489258]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 7.0, 5.0, 3.0, 4.0, 8.0, 21.0, 14.0, 26.0, 35.0, 84.0, 119.0, 186.0, 285.0, 422.0, 716.0, 1098.0, 1915.0, 3190.0, 5063.0, 8157.0, 13365.0, 22283.0, 41961.0, 97821.0, 248287.0, 318069.0, 152764.0, 59854.0, 29369.0, 16924.0, 10356.0, 6238.0, 3712.0, 2283.0, 1446.0, 931.0, 547.0, 357.0, 221.0, 148.0, 95.0, 58.0, 45.0, 31.0, 17.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.714599609375, -2.63037109375, -2.546142578125, -2.4619140625, -2.377685546875, -2.29345703125, -2.209228515625, -2.125, -2.040771484375, -1.95654296875, -1.872314453125, -1.7880859375, -1.703857421875, -1.61962890625, -1.535400390625, -1.451171875, -1.366943359375, -1.28271484375, -1.198486328125, -1.1142578125, -1.030029296875, -0.94580078125, -0.861572265625, -0.77734375, -0.693115234375, -0.60888671875, -0.524658203125, -0.4404296875, -0.356201171875, -0.27197265625, -0.187744140625, -0.103515625, -0.019287109375, 0.06494140625, 0.149169921875, 0.2333984375, 0.317626953125, 0.40185546875, 0.486083984375, 0.5703125, 0.654541015625, 0.73876953125, 0.822998046875, 0.9072265625, 0.991455078125, 1.07568359375, 1.159912109375, 1.244140625, 1.328369140625, 1.41259765625, 1.496826171875, 1.5810546875, 1.665283203125, 1.74951171875, 1.833740234375, 1.91796875, 2.002197265625, 2.08642578125, 2.170654296875, 2.2548828125, 2.339111328125, 2.42333984375, 2.507568359375, 2.591796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 11.0, 9.0, 8.0, 22.0, 21.0, 20.0, 17.0, 27.0, 34.0, 21.0, 33.0, 33.0, 43.0, 34.0, 38.0, 54.0, 52.0, 65.0, 50.0, 42.0, 37.0, 45.0, 29.0, 26.0, 31.0, 40.0, 21.0, 20.0, 16.0, 16.0, 11.0, 19.0, 11.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.9697265625, -1.9087677001953125, -1.847808837890625, -1.7868499755859375, -1.72589111328125, -1.6649322509765625, -1.603973388671875, -1.5430145263671875, -1.4820556640625, -1.4210968017578125, -1.360137939453125, -1.2991790771484375, -1.23822021484375, -1.1772613525390625, -1.116302490234375, -1.0553436279296875, -0.994384765625, -0.9334259033203125, -0.872467041015625, -0.8115081787109375, -0.75054931640625, -0.6895904541015625, -0.628631591796875, -0.5676727294921875, -0.5067138671875, -0.4457550048828125, -0.384796142578125, -0.3238372802734375, -0.26287841796875, -0.2019195556640625, -0.140960693359375, -0.0800018310546875, -0.01904296875, 0.0419158935546875, 0.102874755859375, 0.1638336181640625, 0.22479248046875, 0.2857513427734375, 0.346710205078125, 0.4076690673828125, 0.4686279296875, 0.5295867919921875, 0.590545654296875, 0.6515045166015625, 0.71246337890625, 0.7734222412109375, 0.834381103515625, 0.8953399658203125, 0.956298828125, 1.0172576904296875, 1.078216552734375, 1.1391754150390625, 1.20013427734375, 1.2610931396484375, 1.322052001953125, 1.3830108642578125, 1.4439697265625, 1.5049285888671875, 1.565887451171875, 1.6268463134765625, 1.68780517578125, 1.7487640380859375, 1.809722900390625, 1.8706817626953125, 1.931640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 7.0, 11.0, 14.0, 22.0, 31.0, 38.0, 41.0, 87.0, 130.0, 220.0, 472.0, 918.0, 1923.0, 5113.0, 14841.0, 46004.0, 227565.0, 572259.0, 129576.0, 31642.0, 10671.0, 3842.0, 1552.0, 693.0, 355.0, 182.0, 127.0, 62.0, 44.0, 31.0, 21.0, 24.0, 11.0, 10.0, 2.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.53253173828125, -5.3502197265625, -5.16790771484375, -4.985595703125, -4.80328369140625, -4.6209716796875, -4.43865966796875, -4.25634765625, -4.07403564453125, -3.8917236328125, -3.70941162109375, -3.527099609375, -3.34478759765625, -3.1624755859375, -2.98016357421875, -2.7978515625, -2.61553955078125, -2.4332275390625, -2.25091552734375, -2.068603515625, -1.88629150390625, -1.7039794921875, -1.52166748046875, -1.33935546875, -1.15704345703125, -0.9747314453125, -0.79241943359375, -0.610107421875, -0.42779541015625, -0.2454833984375, -0.06317138671875, 0.119140625, 0.30145263671875, 0.4837646484375, 0.66607666015625, 0.848388671875, 1.03070068359375, 1.2130126953125, 1.39532470703125, 1.57763671875, 1.75994873046875, 1.9422607421875, 2.12457275390625, 2.306884765625, 2.48919677734375, 2.6715087890625, 2.85382080078125, 3.0361328125, 3.21844482421875, 3.4007568359375, 3.58306884765625, 3.765380859375, 3.94769287109375, 4.1300048828125, 4.31231689453125, 4.49462890625, 4.67694091796875, 4.8592529296875, 5.04156494140625, 5.223876953125, 5.40618896484375, 5.5885009765625, 5.77081298828125, 5.953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 12.0, 10.0, 10.0, 8.0, 10.0, 23.0, 17.0, 21.0, 34.0, 30.0, 41.0, 27.0, 38.0, 43.0, 45.0, 55.0, 47.0, 50.0, 41.0, 55.0, 51.0, 49.0, 43.0, 17.0, 34.0, 36.0, 40.0, 20.0, 23.0, 13.0, 13.0, 7.0, 6.0, 6.0, 6.0, 7.0, 1.0, 6.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.53863525390625, -6.3311767578125, -6.12371826171875, -5.916259765625, -5.70880126953125, -5.5013427734375, -5.29388427734375, -5.08642578125, -4.87896728515625, -4.6715087890625, -4.46405029296875, -4.256591796875, -4.04913330078125, -3.8416748046875, -3.63421630859375, -3.4267578125, -3.21929931640625, -3.0118408203125, -2.80438232421875, -2.596923828125, -2.38946533203125, -2.1820068359375, -1.97454833984375, -1.76708984375, -1.55963134765625, -1.3521728515625, -1.14471435546875, -0.937255859375, -0.72979736328125, -0.5223388671875, -0.31488037109375, -0.107421875, 0.10003662109375, 0.3074951171875, 0.51495361328125, 0.722412109375, 0.92987060546875, 1.1373291015625, 1.34478759765625, 1.55224609375, 1.75970458984375, 1.9671630859375, 2.17462158203125, 2.382080078125, 2.58953857421875, 2.7969970703125, 3.00445556640625, 3.2119140625, 3.41937255859375, 3.6268310546875, 3.83428955078125, 4.041748046875, 4.24920654296875, 4.4566650390625, 4.66412353515625, 4.87158203125, 5.07904052734375, 5.2864990234375, 5.49395751953125, 5.701416015625, 5.90887451171875, 6.1163330078125, 6.32379150390625, 6.53125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 11.0, 13.0, 19.0, 30.0, 44.0, 79.0, 99.0, 200.0, 330.0, 555.0, 1043.0, 1877.0, 3304.0, 5924.0, 11196.0, 22537.0, 55347.0, 165963.0, 385045.0, 250420.0, 82625.0, 30655.0, 14369.0, 7565.0, 4160.0, 2220.0, 1226.0, 704.0, 396.0, 254.0, 136.0, 69.0, 54.0, 30.0, 19.0, 11.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.396270751953125, -1.35601806640625, -1.315765380859375, -1.2755126953125, -1.235260009765625, -1.19500732421875, -1.154754638671875, -1.114501953125, -1.074249267578125, -1.03399658203125, -0.993743896484375, -0.9534912109375, -0.913238525390625, -0.87298583984375, -0.832733154296875, -0.79248046875, -0.752227783203125, -0.71197509765625, -0.671722412109375, -0.6314697265625, -0.591217041015625, -0.55096435546875, -0.510711669921875, -0.470458984375, -0.430206298828125, -0.38995361328125, -0.349700927734375, -0.3094482421875, -0.269195556640625, -0.22894287109375, -0.188690185546875, -0.1484375, -0.108184814453125, -0.06793212890625, -0.027679443359375, 0.0125732421875, 0.052825927734375, 0.09307861328125, 0.133331298828125, 0.173583984375, 0.213836669921875, 0.25408935546875, 0.294342041015625, 0.3345947265625, 0.374847412109375, 0.41510009765625, 0.455352783203125, 0.49560546875, 0.535858154296875, 0.57611083984375, 0.616363525390625, 0.6566162109375, 0.696868896484375, 0.73712158203125, 0.777374267578125, 0.817626953125, 0.857879638671875, 0.89813232421875, 0.938385009765625, 0.9786376953125, 1.018890380859375, 1.05914306640625, 1.099395751953125, 1.1396484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 5.0, 8.0, 10.0, 15.0, 14.0, 34.0, 58.0, 70.0, 121.0, 177.0, 155.0, 110.0, 78.0, 38.0, 25.0, 21.0, 8.0, 11.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006437301635742188, -0.000625312328338623, -0.0006068944931030273, -0.0005884766578674316, -0.0005700588226318359, -0.0005516409873962402, -0.0005332231521606445, -0.0005148053169250488, -0.0004963874816894531, -0.0004779696464538574, -0.0004595518112182617, -0.000441133975982666, -0.0004227161407470703, -0.0004042983055114746, -0.0003858804702758789, -0.0003674626350402832, -0.0003490447998046875, -0.0003306269645690918, -0.0003122091293334961, -0.0002937912940979004, -0.0002753734588623047, -0.000256955623626709, -0.00023853778839111328, -0.00022011995315551758, -0.00020170211791992188, -0.00018328428268432617, -0.00016486644744873047, -0.00014644861221313477, -0.00012803077697753906, -0.00010961294174194336, -9.119510650634766e-05, -7.277727127075195e-05, -5.435943603515625e-05, -3.594160079956055e-05, -1.7523765563964844e-05, 8.940696716308594e-07, 1.9311904907226562e-05, 3.7729740142822266e-05, 5.614757537841797e-05, 7.456541061401367e-05, 9.298324584960938e-05, 0.00011140108108520508, 0.00012981891632080078, 0.00014823675155639648, 0.0001666545867919922, 0.0001850724220275879, 0.0002034902572631836, 0.0002219080924987793, 0.000240325927734375, 0.0002587437629699707, 0.0002771615982055664, 0.0002955794334411621, 0.0003139972686767578, 0.0003324151039123535, 0.0003508329391479492, 0.0003692507743835449, 0.0003876686096191406, 0.00040608644485473633, 0.00042450428009033203, 0.00044292211532592773, 0.00046133995056152344, 0.00047975778579711914, 0.0004981756210327148, 0.0005165934562683105, 0.0005350112915039062]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 16.0, 20.0, 13.0, 36.0, 54.0, 86.0, 122.0, 174.0, 351.0, 564.0, 1249.0, 2739.0, 6444.0, 16787.0, 48440.0, 159019.0, 392907.0, 282476.0, 89576.0, 28612.0, 10572.0, 4303.0, 1966.0, 881.0, 462.0, 234.0, 165.0, 94.0, 52.0, 41.0, 24.0, 21.0, 13.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2744140625, -1.2329864501953125, -1.191558837890625, -1.1501312255859375, -1.10870361328125, -1.0672760009765625, -1.025848388671875, -0.9844207763671875, -0.9429931640625, -0.9015655517578125, -0.860137939453125, -0.8187103271484375, -0.77728271484375, -0.7358551025390625, -0.694427490234375, -0.6529998779296875, -0.611572265625, -0.5701446533203125, -0.528717041015625, -0.4872894287109375, -0.44586181640625, -0.4044342041015625, -0.363006591796875, -0.3215789794921875, -0.2801513671875, -0.2387237548828125, -0.197296142578125, -0.1558685302734375, -0.11444091796875, -0.0730133056640625, -0.031585693359375, 0.0098419189453125, 0.05126953125, 0.0926971435546875, 0.134124755859375, 0.1755523681640625, 0.21697998046875, 0.2584075927734375, 0.299835205078125, 0.3412628173828125, 0.3826904296875, 0.4241180419921875, 0.465545654296875, 0.5069732666015625, 0.54840087890625, 0.5898284912109375, 0.631256103515625, 0.6726837158203125, 0.714111328125, 0.7555389404296875, 0.796966552734375, 0.8383941650390625, 0.87982177734375, 0.9212493896484375, 0.962677001953125, 1.0041046142578125, 1.0455322265625, 1.0869598388671875, 1.128387451171875, 1.1698150634765625, 1.21124267578125, 1.2526702880859375, 1.294097900390625, 1.3355255126953125, 1.376953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 8.0, 5.0, 13.0, 18.0, 18.0, 15.0, 29.0, 35.0, 38.0, 42.0, 43.0, 51.0, 62.0, 60.0, 58.0, 58.0, 56.0, 63.0, 46.0, 48.0, 40.0, 35.0, 24.0, 19.0, 20.0, 9.0, 11.0, 5.0, 9.0, 4.0, 7.0, 5.0, 5.0, 7.0, 2.0, 6.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98046875, -0.9474029541015625, -0.914337158203125, -0.8812713623046875, -0.84820556640625, -0.8151397705078125, -0.782073974609375, -0.7490081787109375, -0.7159423828125, -0.6828765869140625, -0.649810791015625, -0.6167449951171875, -0.58367919921875, -0.5506134033203125, -0.517547607421875, -0.4844818115234375, -0.451416015625, -0.4183502197265625, -0.385284423828125, -0.3522186279296875, -0.31915283203125, -0.2860870361328125, -0.253021240234375, -0.2199554443359375, -0.1868896484375, -0.1538238525390625, -0.120758056640625, -0.0876922607421875, -0.05462646484375, -0.0215606689453125, 0.011505126953125, 0.0445709228515625, 0.07763671875, 0.1107025146484375, 0.143768310546875, 0.1768341064453125, 0.20989990234375, 0.2429656982421875, 0.276031494140625, 0.3090972900390625, 0.3421630859375, 0.3752288818359375, 0.408294677734375, 0.4413604736328125, 0.47442626953125, 0.5074920654296875, 0.540557861328125, 0.5736236572265625, 0.606689453125, 0.6397552490234375, 0.672821044921875, 0.7058868408203125, 0.73895263671875, 0.7720184326171875, 0.805084228515625, 0.8381500244140625, 0.8712158203125, 0.9042816162109375, 0.937347412109375, 0.9704132080078125, 1.00347900390625, 1.0365447998046875, 1.069610595703125, 1.1026763916015625, 1.1357421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 19.0, 27.0, 64.0, 143.0, 148.0, 208.0, 166.0, 111.0, 50.0, 28.0, 22.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.37370491027832, -17.480655670166016, -16.587604522705078, -15.694555282592773, -14.801506042480469, -13.908456802368164, -13.015406608581543, -12.122356414794922, -11.229307174682617, -10.336257934570312, -9.443207740783691, -8.55015754699707, -7.657108306884766, -6.764058589935303, -5.87100887298584, -4.977959156036377, -4.084909439086914, -3.191859722137451, -2.2988100051879883, -1.4057602882385254, -0.5127105712890625, 0.3803391456604004, 1.2733888626098633, 2.166438579559326, 3.059488296508789, 3.952538013458252, 4.845587730407715, 5.738637447357178, 6.631687164306641, 7.5247368812561035, 8.417786598205566, 9.310836791992188, 10.203887939453125, 11.09693717956543, 11.98998737335205, 12.883037567138672, 13.776086807250977, 14.669136047363281, 15.562186241149902, 16.455236434936523, 17.348285675048828, 18.241334915161133, 19.134384155273438, 20.027435302734375, 20.92048454284668, 21.813533782958984, 22.706584930419922, 23.599634170532227, 24.49268341064453, 25.385732650756836, 26.27878189086914, 27.171833038330078, 28.064882278442383, 28.957931518554688, 29.850982666015625, 30.74403190612793, 31.637081146240234, 32.53013229370117, 33.423179626464844, 34.31623077392578, 35.20928192138672, 36.10232925415039, 36.99538040161133, 37.888427734375, 38.78147888183594]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 2.0, 11.0, 9.0, 8.0, 14.0, 14.0, 19.0, 19.0, 35.0, 33.0, 25.0, 34.0, 32.0, 44.0, 42.0, 41.0, 48.0, 46.0, 58.0, 53.0, 41.0, 33.0, 52.0, 35.0, 31.0, 30.0, 19.0, 31.0, 29.0, 13.0, 13.0, 14.0, 10.0, 6.0, 14.0, 7.0, 4.0, 6.0, 2.0, 3.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.734094619750977, -14.256233215332031, -13.778371810913086, -13.30051040649414, -12.822648048400879, -12.344786643981934, -11.866925239562988, -11.389063835144043, -10.911201477050781, -10.433340072631836, -9.95547866821289, -9.477617263793945, -8.999754905700684, -8.521893501281738, -8.044032096862793, -7.566170692443848, -7.088309288024902, -6.610447883605957, -6.1325860023498535, -5.654724597930908, -5.176862716674805, -4.699001312255859, -4.221139907836914, -3.7432782649993896, -3.2654166221618652, -2.787554979324341, -2.3096933364868164, -1.831831932067871, -1.3539702892303467, -0.8761086463928223, -0.39824724197387695, 0.07961440086364746, 0.5574769973754883, 1.0353386402130127, 1.5132001638412476, 1.9910616874694824, 2.468923330307007, 2.9467849731445312, 3.4246463775634766, 3.902508020401001, 4.380369663238525, 4.858231067657471, 5.336092948913574, 5.8139543533325195, 6.291815757751465, 6.769677639007568, 7.247539043426514, 7.725400924682617, 8.203262329101562, 8.681123733520508, 9.158985137939453, 9.636846542358398, 10.11470890045166, 10.592570304870605, 11.07043170928955, 11.548293113708496, 12.026155471801758, 12.504016876220703, 12.981878280639648, 13.459739685058594, 13.937602043151855, 14.4154634475708, 14.893324851989746, 15.371186256408691, 15.849047660827637]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 12.0, 11.0, 27.0, 36.0, 53.0, 76.0, 160.0, 260.0, 499.0, 1069.0, 2450.0, 5838.0, 15448.0, 44820.0, 146965.0, 553301.0, 1681536.0, 1262143.0, 336998.0, 93768.0, 30139.0, 10645.0, 4293.0, 1870.0, 821.0, 419.0, 224.0, 133.0, 89.0, 54.0, 45.0, 27.0, 15.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.392578125, -2.312347412109375, -2.23211669921875, -2.151885986328125, -2.0716552734375, -1.991424560546875, -1.91119384765625, -1.830963134765625, -1.750732421875, -1.670501708984375, -1.59027099609375, -1.510040283203125, -1.4298095703125, -1.349578857421875, -1.26934814453125, -1.189117431640625, -1.10888671875, -1.028656005859375, -0.94842529296875, -0.868194580078125, -0.7879638671875, -0.707733154296875, -0.62750244140625, -0.547271728515625, -0.467041015625, -0.386810302734375, -0.30657958984375, -0.226348876953125, -0.1461181640625, -0.065887451171875, 0.01434326171875, 0.094573974609375, 0.1748046875, 0.255035400390625, 0.33526611328125, 0.415496826171875, 0.4957275390625, 0.575958251953125, 0.65618896484375, 0.736419677734375, 0.816650390625, 0.896881103515625, 0.97711181640625, 1.057342529296875, 1.1375732421875, 1.217803955078125, 1.29803466796875, 1.378265380859375, 1.45849609375, 1.538726806640625, 1.61895751953125, 1.699188232421875, 1.7794189453125, 1.859649658203125, 1.93988037109375, 2.020111083984375, 2.100341796875, 2.180572509765625, 2.26080322265625, 2.341033935546875, 2.4212646484375, 2.501495361328125, 2.58172607421875, 2.661956787109375, 2.7421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 10.0, 11.0, 19.0, 24.0, 30.0, 27.0, 40.0, 27.0, 37.0, 39.0, 33.0, 58.0, 54.0, 43.0, 43.0, 44.0, 45.0, 55.0, 46.0, 38.0, 34.0, 43.0, 22.0, 24.0, 28.0, 21.0, 11.0, 8.0, 10.0, 15.0, 8.0, 6.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8388671875, -1.7763824462890625, -1.713897705078125, -1.6514129638671875, -1.58892822265625, -1.5264434814453125, -1.463958740234375, -1.4014739990234375, -1.3389892578125, -1.2765045166015625, -1.214019775390625, -1.1515350341796875, -1.08905029296875, -1.0265655517578125, -0.964080810546875, -0.9015960693359375, -0.839111328125, -0.7766265869140625, -0.714141845703125, -0.6516571044921875, -0.58917236328125, -0.5266876220703125, -0.464202880859375, -0.4017181396484375, -0.3392333984375, -0.2767486572265625, -0.214263916015625, -0.1517791748046875, -0.08929443359375, -0.0268096923828125, 0.035675048828125, 0.0981597900390625, 0.16064453125, 0.2231292724609375, 0.285614013671875, 0.3480987548828125, 0.41058349609375, 0.4730682373046875, 0.535552978515625, 0.5980377197265625, 0.6605224609375, 0.7230072021484375, 0.785491943359375, 0.8479766845703125, 0.91046142578125, 0.9729461669921875, 1.035430908203125, 1.0979156494140625, 1.160400390625, 1.2228851318359375, 1.285369873046875, 1.3478546142578125, 1.41033935546875, 1.4728240966796875, 1.535308837890625, 1.5977935791015625, 1.6602783203125, 1.7227630615234375, 1.785247802734375, 1.8477325439453125, 1.91021728515625, 1.9727020263671875, 2.035186767578125, 2.0976715087890625, 2.16015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 20.0, 33.0, 45.0, 69.0, 120.0, 235.0, 377.0, 792.0, 1653.0, 4090.0, 11856.0, 45446.0, 223942.0, 1697297.0, 1889179.0, 249072.0, 49479.0, 12681.0, 4308.0, 1774.0, 838.0, 399.0, 213.0, 135.0, 85.0, 51.0, 25.0, 18.0, 7.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.671875, -4.52130126953125, -4.3707275390625, -4.22015380859375, -4.069580078125, -3.91900634765625, -3.7684326171875, -3.61785888671875, -3.46728515625, -3.31671142578125, -3.1661376953125, -3.01556396484375, -2.864990234375, -2.71441650390625, -2.5638427734375, -2.41326904296875, -2.2626953125, -2.11212158203125, -1.9615478515625, -1.81097412109375, -1.660400390625, -1.50982666015625, -1.3592529296875, -1.20867919921875, -1.05810546875, -0.90753173828125, -0.7569580078125, -0.60638427734375, -0.455810546875, -0.30523681640625, -0.1546630859375, -0.00408935546875, 0.146484375, 0.29705810546875, 0.4476318359375, 0.59820556640625, 0.748779296875, 0.89935302734375, 1.0499267578125, 1.20050048828125, 1.35107421875, 1.50164794921875, 1.6522216796875, 1.80279541015625, 1.953369140625, 2.10394287109375, 2.2545166015625, 2.40509033203125, 2.5556640625, 2.70623779296875, 2.8568115234375, 3.00738525390625, 3.157958984375, 3.30853271484375, 3.4591064453125, 3.60968017578125, 3.76025390625, 3.91082763671875, 4.0614013671875, 4.21197509765625, 4.362548828125, 4.51312255859375, 4.6636962890625, 4.81427001953125, 4.96484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 17.0, 12.0, 23.0, 28.0, 51.0, 72.0, 74.0, 109.0, 169.0, 230.0, 306.0, 510.0, 629.0, 522.0, 408.0, 245.0, 185.0, 128.0, 89.0, 68.0, 38.0, 31.0, 33.0, 23.0, 16.0, 17.0, 5.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.113861083984375, -2.97576904296875, -2.837677001953125, -2.6995849609375, -2.561492919921875, -2.42340087890625, -2.285308837890625, -2.147216796875, -2.009124755859375, -1.87103271484375, -1.732940673828125, -1.5948486328125, -1.456756591796875, -1.31866455078125, -1.180572509765625, -1.04248046875, -0.904388427734375, -0.76629638671875, -0.628204345703125, -0.4901123046875, -0.352020263671875, -0.21392822265625, -0.075836181640625, 0.062255859375, 0.200347900390625, 0.33843994140625, 0.476531982421875, 0.6146240234375, 0.752716064453125, 0.89080810546875, 1.028900146484375, 1.1669921875, 1.305084228515625, 1.44317626953125, 1.581268310546875, 1.7193603515625, 1.857452392578125, 1.99554443359375, 2.133636474609375, 2.271728515625, 2.409820556640625, 2.54791259765625, 2.686004638671875, 2.8240966796875, 2.962188720703125, 3.10028076171875, 3.238372802734375, 3.37646484375, 3.514556884765625, 3.65264892578125, 3.790740966796875, 3.9288330078125, 4.066925048828125, 4.20501708984375, 4.343109130859375, 4.481201171875, 4.619293212890625, 4.75738525390625, 4.895477294921875, 5.0335693359375, 5.171661376953125, 5.30975341796875, 5.447845458984375, 5.5859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 6.0, 9.0, 35.0, 90.0, 217.0, 293.0, 215.0, 95.0, 26.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.83698654174805, -57.022987365722656, -55.208984375, -53.39498519897461, -51.58098220825195, -49.76698303222656, -47.952980041503906, -46.138980865478516, -44.324981689453125, -42.510982513427734, -40.69697952270508, -38.88298034667969, -37.06897735595703, -35.25497817993164, -33.44097900390625, -31.626976013183594, -29.812973022460938, -27.998971939086914, -26.18497085571289, -24.3709716796875, -22.556968688964844, -20.742969512939453, -18.92896842956543, -17.114967346191406, -15.300966262817383, -13.48696517944336, -11.672964096069336, -9.858963966369629, -8.044962882995605, -6.230961799621582, -4.416961669921875, -2.6029605865478516, -0.7889633178710938, 1.0250375270843506, 2.839038372039795, 4.65303897857666, 6.467040061950684, 8.281041145324707, 10.095041275024414, 11.909042358398438, 13.723043441772461, 15.537044525146484, 17.351045608520508, 19.16504669189453, 20.979045867919922, 22.793048858642578, 24.60704803466797, 26.421049118041992, 28.235050201416016, 30.04905128479004, 31.863052368164062, 33.67705154418945, 35.49105453491211, 37.3050537109375, 39.119056701660156, 40.93305587768555, 42.74705505371094, 44.56105422973633, 46.375057220458984, 48.189056396484375, 50.00305938720703, 51.81705856323242, 53.63105773925781, 55.44506072998047, 57.259063720703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 10.0, 8.0, 8.0, 10.0, 17.0, 9.0, 14.0, 20.0, 28.0, 20.0, 32.0, 25.0, 31.0, 38.0, 26.0, 28.0, 37.0, 40.0, 36.0, 35.0, 41.0, 31.0, 45.0, 33.0, 43.0, 54.0, 43.0, 36.0, 26.0, 25.0, 28.0, 14.0, 17.0, 15.0, 17.0, 13.0, 10.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.789836883544922, -12.391395568847656, -11.99295425415039, -11.594512939453125, -11.19607162475586, -10.797630310058594, -10.399188995361328, -10.000747680664062, -9.602306365966797, -9.203865051269531, -8.805423736572266, -8.406982421875, -8.008541107177734, -7.610099792480469, -7.211658477783203, -6.8132171630859375, -6.41477632522583, -6.0163350105285645, -5.617893695831299, -5.219452381134033, -4.821011066436768, -4.422569751739502, -4.0241289138793945, -3.62568736076355, -3.227246046066284, -2.8288047313690186, -2.430363416671753, -2.0319223403930664, -1.6334809064865112, -1.2350395917892456, -0.8365983963012695, -0.4381570816040039, -0.03971576690673828, 0.35872551798820496, 0.7571668028831482, 1.155608057975769, 1.5540493726730347, 1.9524906873703003, 2.3509318828582764, 2.749373197555542, 3.1478145122528076, 3.5462558269500732, 3.944697141647339, 4.343138217926025, 4.741579532623291, 5.140020847320557, 5.538462162017822, 5.936903476715088, 6.3353447914123535, 6.733786106109619, 7.132227420806885, 7.53066873550415, 7.929110050201416, 8.327550888061523, 8.725992202758789, 9.124433517456055, 9.52287483215332, 9.921316146850586, 10.319757461547852, 10.718198776245117, 11.116640090942383, 11.515081405639648, 11.913522720336914, 12.31196403503418, 12.710405349731445]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 16.0, 16.0, 24.0, 38.0, 42.0, 86.0, 131.0, 183.0, 339.0, 518.0, 948.0, 1668.0, 3014.0, 5514.0, 10737.0, 21929.0, 45424.0, 90352.0, 159244.0, 216539.0, 204971.0, 137976.0, 74815.0, 36580.0, 17857.0, 8841.0, 4716.0, 2535.0, 1393.0, 807.0, 482.0, 320.0, 148.0, 134.0, 71.0, 46.0, 29.0, 13.0, 16.0, 8.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.9130859375, -1.8548583984375, -1.796630859375, -1.7384033203125, -1.68017578125, -1.6219482421875, -1.563720703125, -1.5054931640625, -1.447265625, -1.3890380859375, -1.330810546875, -1.2725830078125, -1.21435546875, -1.1561279296875, -1.097900390625, -1.0396728515625, -0.9814453125, -0.9232177734375, -0.864990234375, -0.8067626953125, -0.74853515625, -0.6903076171875, -0.632080078125, -0.5738525390625, -0.515625, -0.4573974609375, -0.399169921875, -0.3409423828125, -0.28271484375, -0.2244873046875, -0.166259765625, -0.1080322265625, -0.0498046875, 0.0084228515625, 0.066650390625, 0.1248779296875, 0.18310546875, 0.2413330078125, 0.299560546875, 0.3577880859375, 0.416015625, 0.4742431640625, 0.532470703125, 0.5906982421875, 0.64892578125, 0.7071533203125, 0.765380859375, 0.8236083984375, 0.8818359375, 0.9400634765625, 0.998291015625, 1.0565185546875, 1.11474609375, 1.1729736328125, 1.231201171875, 1.2894287109375, 1.34765625, 1.4058837890625, 1.464111328125, 1.5223388671875, 1.58056640625, 1.6387939453125, 1.697021484375, 1.7552490234375, 1.8134765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 11.0, 9.0, 8.0, 19.0, 13.0, 12.0, 28.0, 40.0, 30.0, 42.0, 39.0, 54.0, 47.0, 61.0, 55.0, 62.0, 59.0, 34.0, 59.0, 44.0, 42.0, 39.0, 42.0, 35.0, 20.0, 16.0, 30.0, 12.0, 8.0, 13.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.473846435546875, -1.40277099609375, -1.331695556640625, -1.2606201171875, -1.189544677734375, -1.11846923828125, -1.047393798828125, -0.976318359375, -0.905242919921875, -0.83416748046875, -0.763092041015625, -0.6920166015625, -0.620941162109375, -0.54986572265625, -0.478790283203125, -0.40771484375, -0.336639404296875, -0.26556396484375, -0.194488525390625, -0.1234130859375, -0.052337646484375, 0.01873779296875, 0.089813232421875, 0.160888671875, 0.231964111328125, 0.30303955078125, 0.374114990234375, 0.4451904296875, 0.516265869140625, 0.58734130859375, 0.658416748046875, 0.7294921875, 0.800567626953125, 0.87164306640625, 0.942718505859375, 1.0137939453125, 1.084869384765625, 1.15594482421875, 1.227020263671875, 1.298095703125, 1.369171142578125, 1.44024658203125, 1.511322021484375, 1.5823974609375, 1.653472900390625, 1.72454833984375, 1.795623779296875, 1.86669921875, 1.937774658203125, 2.00885009765625, 2.079925537109375, 2.1510009765625, 2.222076416015625, 2.29315185546875, 2.364227294921875, 2.435302734375, 2.506378173828125, 2.57745361328125, 2.648529052734375, 2.7196044921875, 2.790679931640625, 2.86175537109375, 2.932830810546875, 3.00390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 13.0, 23.0, 23.0, 25.0, 61.0, 110.0, 148.0, 233.0, 405.0, 713.0, 1476.0, 2910.0, 6636.0, 17009.0, 47724.0, 131961.0, 277248.0, 302332.0, 162466.0, 60138.0, 21452.0, 8116.0, 3505.0, 1644.0, 884.0, 473.0, 285.0, 171.0, 115.0, 78.0, 49.0, 38.0, 29.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.27545166015625, -2.1915283203125, -2.10760498046875, -2.023681640625, -1.93975830078125, -1.8558349609375, -1.77191162109375, -1.68798828125, -1.60406494140625, -1.5201416015625, -1.43621826171875, -1.352294921875, -1.26837158203125, -1.1844482421875, -1.10052490234375, -1.0166015625, -0.93267822265625, -0.8487548828125, -0.76483154296875, -0.680908203125, -0.59698486328125, -0.5130615234375, -0.42913818359375, -0.34521484375, -0.26129150390625, -0.1773681640625, -0.09344482421875, -0.009521484375, 0.07440185546875, 0.1583251953125, 0.24224853515625, 0.326171875, 0.41009521484375, 0.4940185546875, 0.57794189453125, 0.661865234375, 0.74578857421875, 0.8297119140625, 0.91363525390625, 0.99755859375, 1.08148193359375, 1.1654052734375, 1.24932861328125, 1.333251953125, 1.41717529296875, 1.5010986328125, 1.58502197265625, 1.6689453125, 1.75286865234375, 1.8367919921875, 1.92071533203125, 2.004638671875, 2.08856201171875, 2.1724853515625, 2.25640869140625, 2.34033203125, 2.42425537109375, 2.5081787109375, 2.59210205078125, 2.676025390625, 2.75994873046875, 2.8438720703125, 2.92779541015625, 3.01171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 5.0, 5.0, 15.0, 10.0, 12.0, 25.0, 18.0, 20.0, 37.0, 38.0, 44.0, 46.0, 56.0, 48.0, 48.0, 43.0, 53.0, 51.0, 41.0, 41.0, 52.0, 53.0, 39.0, 40.0, 34.0, 26.0, 25.0, 23.0, 15.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.5067138671875, -6.306396484375, -6.1060791015625, -5.90576171875, -5.7054443359375, -5.505126953125, -5.3048095703125, -5.1044921875, -4.9041748046875, -4.703857421875, -4.5035400390625, -4.30322265625, -4.1029052734375, -3.902587890625, -3.7022705078125, -3.501953125, -3.3016357421875, -3.101318359375, -2.9010009765625, -2.70068359375, -2.5003662109375, -2.300048828125, -2.0997314453125, -1.8994140625, -1.6990966796875, -1.498779296875, -1.2984619140625, -1.09814453125, -0.8978271484375, -0.697509765625, -0.4971923828125, -0.296875, -0.0965576171875, 0.103759765625, 0.3040771484375, 0.50439453125, 0.7047119140625, 0.905029296875, 1.1053466796875, 1.3056640625, 1.5059814453125, 1.706298828125, 1.9066162109375, 2.10693359375, 2.3072509765625, 2.507568359375, 2.7078857421875, 2.908203125, 3.1085205078125, 3.308837890625, 3.5091552734375, 3.70947265625, 3.9097900390625, 4.110107421875, 4.3104248046875, 4.5107421875, 4.7110595703125, 4.911376953125, 5.1116943359375, 5.31201171875, 5.5123291015625, 5.712646484375, 5.9129638671875, 6.11328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 18.0, 11.0, 14.0, 40.0, 67.0, 98.0, 153.0, 233.0, 443.0, 777.0, 1380.0, 2783.0, 5358.0, 10898.0, 21730.0, 44300.0, 88553.0, 158231.0, 221579.0, 208569.0, 137132.0, 73341.0, 36640.0, 17853.0, 8756.0, 4414.0, 2307.0, 1198.0, 662.0, 403.0, 204.0, 122.0, 96.0, 57.0, 31.0, 31.0, 16.0, 14.0, 11.0, 10.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8592605590820312, -0.8322906494140625, -0.8053207397460938, -0.778350830078125, -0.7513809204101562, -0.7244110107421875, -0.6974411010742188, -0.67047119140625, -0.6435012817382812, -0.6165313720703125, -0.5895614624023438, -0.562591552734375, -0.5356216430664062, -0.5086517333984375, -0.48168182373046875, -0.4547119140625, -0.42774200439453125, -0.4007720947265625, -0.37380218505859375, -0.346832275390625, -0.31986236572265625, -0.2928924560546875, -0.26592254638671875, -0.23895263671875, -0.21198272705078125, -0.1850128173828125, -0.15804290771484375, -0.131072998046875, -0.10410308837890625, -0.0771331787109375, -0.05016326904296875, -0.023193359375, 0.00377655029296875, 0.0307464599609375, 0.05771636962890625, 0.084686279296875, 0.11165618896484375, 0.1386260986328125, 0.16559600830078125, 0.19256591796875, 0.21953582763671875, 0.2465057373046875, 0.27347564697265625, 0.300445556640625, 0.32741546630859375, 0.3543853759765625, 0.38135528564453125, 0.4083251953125, 0.43529510498046875, 0.4622650146484375, 0.48923492431640625, 0.516204833984375, 0.5431747436523438, 0.5701446533203125, 0.5971145629882812, 0.62408447265625, 0.6510543823242188, 0.6780242919921875, 0.7049942016601562, 0.731964111328125, 0.7589340209960938, 0.7859039306640625, 0.8128738403320312, 0.83984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 7.0, 5.0, 4.0, 8.0, 8.0, 11.0, 11.0, 14.0, 18.0, 26.0, 23.0, 26.0, 37.0, 36.0, 64.0, 53.0, 68.0, 72.0, 70.0, 50.0, 59.0, 64.0, 46.0, 42.0, 26.0, 27.0, 26.0, 15.0, 16.0, 13.0, 12.0, 8.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002887248992919922, -0.00028036534786224365, -0.0002720057964324951, -0.0002636462450027466, -0.00025528669357299805, -0.0002469271421432495, -0.00023856759071350098, -0.00023020803928375244, -0.0002218484878540039, -0.00021348893642425537, -0.00020512938499450684, -0.0001967698335647583, -0.00018841028213500977, -0.00018005073070526123, -0.0001716911792755127, -0.00016333162784576416, -0.00015497207641601562, -0.0001466125249862671, -0.00013825297355651855, -0.00012989342212677002, -0.00012153387069702148, -0.00011317431926727295, -0.00010481476783752441, -9.645521640777588e-05, -8.809566497802734e-05, -7.973611354827881e-05, -7.137656211853027e-05, -6.301701068878174e-05, -5.46574592590332e-05, -4.629790782928467e-05, -3.793835639953613e-05, -2.9578804969787598e-05, -2.1219253540039062e-05, -1.2859702110290527e-05, -4.500150680541992e-06, 3.859400749206543e-06, 1.2218952178955078e-05, 2.0578503608703613e-05, 2.893805503845215e-05, 3.7297606468200684e-05, 4.565715789794922e-05, 5.4016709327697754e-05, 6.237626075744629e-05, 7.073581218719482e-05, 7.909536361694336e-05, 8.74549150466919e-05, 9.581446647644043e-05, 0.00010417401790618896, 0.0001125335693359375, 0.00012089312076568604, 0.00012925267219543457, 0.0001376122236251831, 0.00014597177505493164, 0.00015433132648468018, 0.0001626908779144287, 0.00017105042934417725, 0.00017940998077392578, 0.00018776953220367432, 0.00019612908363342285, 0.0002044886350631714, 0.00021284818649291992, 0.00022120773792266846, 0.000229567289352417, 0.00023792684078216553, 0.00024628639221191406]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 10.0, 13.0, 18.0, 23.0, 67.0, 78.0, 141.0, 277.0, 482.0, 937.0, 1985.0, 4340.0, 10329.0, 24901.0, 61953.0, 139045.0, 239127.0, 258411.0, 169475.0, 79592.0, 33146.0, 13368.0, 5693.0, 2570.0, 1218.0, 599.0, 299.0, 173.0, 119.0, 53.0, 37.0, 33.0, 8.0, 10.0, 9.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91650390625, -0.8850631713867188, -0.8536224365234375, -0.8221817016601562, -0.790740966796875, -0.7593002319335938, -0.7278594970703125, -0.6964187622070312, -0.66497802734375, -0.6335372924804688, -0.6020965576171875, -0.5706558227539062, -0.539215087890625, -0.5077743530273438, -0.4763336181640625, -0.44489288330078125, -0.4134521484375, -0.38201141357421875, -0.3505706787109375, -0.31912994384765625, -0.287689208984375, -0.25624847412109375, -0.2248077392578125, -0.19336700439453125, -0.16192626953125, -0.13048553466796875, -0.0990447998046875, -0.06760406494140625, -0.036163330078125, -0.00472259521484375, 0.0267181396484375, 0.05815887451171875, 0.089599609375, 0.12104034423828125, 0.1524810791015625, 0.18392181396484375, 0.215362548828125, 0.24680328369140625, 0.2782440185546875, 0.30968475341796875, 0.34112548828125, 0.37256622314453125, 0.4040069580078125, 0.43544769287109375, 0.466888427734375, 0.49832916259765625, 0.5297698974609375, 0.5612106323242188, 0.5926513671875, 0.6240921020507812, 0.6555328369140625, 0.6869735717773438, 0.718414306640625, 0.7498550415039062, 0.7812957763671875, 0.8127365112304688, 0.84417724609375, 0.8756179809570312, 0.9070587158203125, 0.9384994506835938, 0.969940185546875, 1.0013809204101562, 1.0328216552734375, 1.0642623901367188, 1.095703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 10.0, 14.0, 11.0, 17.0, 25.0, 21.0, 23.0, 18.0, 31.0, 36.0, 40.0, 55.0, 42.0, 71.0, 50.0, 63.0, 55.0, 45.0, 56.0, 51.0, 30.0, 31.0, 37.0, 27.0, 30.0, 25.0, 18.0, 19.0, 8.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.1287155151367188, -1.0953216552734375, -1.0619277954101562, -1.028533935546875, -0.9951400756835938, -0.9617462158203125, -0.9283523559570312, -0.89495849609375, -0.8615646362304688, -0.8281707763671875, -0.7947769165039062, -0.761383056640625, -0.7279891967773438, -0.6945953369140625, -0.6612014770507812, -0.6278076171875, -0.5944137573242188, -0.5610198974609375, -0.5276260375976562, -0.494232177734375, -0.46083831787109375, -0.4274444580078125, -0.39405059814453125, -0.36065673828125, -0.32726287841796875, -0.2938690185546875, -0.26047515869140625, -0.227081298828125, -0.19368743896484375, -0.1602935791015625, -0.12689971923828125, -0.093505859375, -0.06011199951171875, -0.0267181396484375, 0.00667572021484375, 0.040069580078125, 0.07346343994140625, 0.1068572998046875, 0.14025115966796875, 0.17364501953125, 0.20703887939453125, 0.2404327392578125, 0.27382659912109375, 0.307220458984375, 0.34061431884765625, 0.3740081787109375, 0.40740203857421875, 0.4407958984375, 0.47418975830078125, 0.5075836181640625, 0.5409774780273438, 0.574371337890625, 0.6077651977539062, 0.6411590576171875, 0.6745529174804688, 0.70794677734375, 0.7413406372070312, 0.7747344970703125, 0.8081283569335938, 0.841522216796875, 0.8749160766601562, 0.9083099365234375, 0.9417037963867188, 0.97509765625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 13.0, 20.0, 86.0, 174.0, 259.0, 200.0, 133.0, 71.0, 22.0, 7.0, 2.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.65446472167969, -31.742692947387695, -30.830921173095703, -29.91914939880371, -29.00737762451172, -28.09560775756836, -27.183834075927734, -26.272064208984375, -25.360292434692383, -24.44852066040039, -23.5367488861084, -22.624977111816406, -21.713205337524414, -20.801433563232422, -19.889663696289062, -18.97789192199707, -18.066120147705078, -17.154348373413086, -16.242576599121094, -15.330804824829102, -14.419034004211426, -13.507262229919434, -12.595490455627441, -11.683719635009766, -10.77194595336914, -9.860174179077148, -8.948402404785156, -8.036630630493164, -7.124859809875488, -6.213088035583496, -5.301316261291504, -4.38954496383667, -3.477773666381836, -2.566002130508423, -1.6542304754257202, -0.7424588203430176, 0.1693127155303955, 1.0810842514038086, 1.9928560256958008, 2.9046273231506348, 3.816399097442627, 4.728170871734619, 5.639942169189453, 6.551713943481445, 7.4634857177734375, 8.37525749206543, 9.287029266357422, 10.198800086975098, 11.11057186126709, 12.022343635559082, 12.934115409851074, 13.84588623046875, 14.757658004760742, 15.669429779052734, 16.581201553344727, 17.49297332763672, 18.40474510192871, 19.316516876220703, 20.228288650512695, 21.140060424804688, 22.05183219909668, 22.963603973388672, 23.87537384033203, 24.787145614624023, 25.698917388916016]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 10.0, 11.0, 17.0, 19.0, 16.0, 18.0, 13.0, 15.0, 26.0, 27.0, 26.0, 43.0, 37.0, 46.0, 36.0, 41.0, 39.0, 45.0, 50.0, 37.0, 40.0, 31.0, 38.0, 35.0, 38.0, 27.0, 30.0, 27.0, 24.0, 19.0, 25.0, 12.0, 8.0, 13.0, 8.0, 12.0, 10.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.338685989379883, -14.875646591186523, -14.41260814666748, -13.949569702148438, -13.486530303955078, -13.023490905761719, -12.560452461242676, -12.097414016723633, -11.634374618530273, -11.171335220336914, -10.708296775817871, -10.245258331298828, -9.782218933105469, -9.31917953491211, -8.856141090393066, -8.393102645874023, -7.930063247680664, -7.467024326324463, -7.003985404968262, -6.5409464836120605, -6.077907562255859, -5.614868640899658, -5.151829719543457, -4.688790798187256, -4.225751876831055, -3.7627129554748535, -3.2996740341186523, -2.836635112762451, -2.37359619140625, -1.9105572700500488, -1.4475183486938477, -0.9844794273376465, -0.5214405059814453, -0.05840158462524414, 0.40463733673095703, 0.8676762580871582, 1.3307151794433594, 1.7937541007995605, 2.2567930221557617, 2.719831943511963, 3.182870864868164, 3.6459097862243652, 4.108948707580566, 4.571987628936768, 5.035026550292969, 5.49806547164917, 5.961104393005371, 6.424143314361572, 6.887182235717773, 7.350221157073975, 7.813260078430176, 8.276298522949219, 8.739337921142578, 9.202377319335938, 9.66541576385498, 10.128454208374023, 10.591493606567383, 11.054533004760742, 11.517571449279785, 11.980609893798828, 12.443649291992188, 12.906688690185547, 13.36972713470459, 13.832765579223633, 14.295804977416992]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 16.0, 31.0, 32.0, 99.0, 169.0, 353.0, 661.0, 1421.0, 3081.0, 7308.0, 19262.0, 61370.0, 248718.0, 1055858.0, 1922754.0, 669899.0, 143621.0, 37275.0, 12338.0, 5030.0, 2273.0, 1148.0, 635.0, 335.0, 190.0, 118.0, 82.0, 55.0, 39.0, 18.0, 21.0, 24.0, 12.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.089874267578125, -2.00396728515625, -1.918060302734375, -1.8321533203125, -1.746246337890625, -1.66033935546875, -1.574432373046875, -1.488525390625, -1.402618408203125, -1.31671142578125, -1.230804443359375, -1.1448974609375, -1.058990478515625, -0.97308349609375, -0.887176513671875, -0.80126953125, -0.715362548828125, -0.62945556640625, -0.543548583984375, -0.4576416015625, -0.371734619140625, -0.28582763671875, -0.199920654296875, -0.114013671875, -0.028106689453125, 0.05780029296875, 0.143707275390625, 0.2296142578125, 0.315521240234375, 0.40142822265625, 0.487335205078125, 0.5732421875, 0.659149169921875, 0.74505615234375, 0.830963134765625, 0.9168701171875, 1.002777099609375, 1.08868408203125, 1.174591064453125, 1.260498046875, 1.346405029296875, 1.43231201171875, 1.518218994140625, 1.6041259765625, 1.690032958984375, 1.77593994140625, 1.861846923828125, 1.94775390625, 2.033660888671875, 2.11956787109375, 2.205474853515625, 2.2913818359375, 2.377288818359375, 2.46319580078125, 2.549102783203125, 2.635009765625, 2.720916748046875, 2.80682373046875, 2.892730712890625, 2.9786376953125, 3.064544677734375, 3.15045166015625, 3.236358642578125, 3.322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 9.0, 12.0, 16.0, 21.0, 20.0, 20.0, 24.0, 30.0, 41.0, 42.0, 40.0, 50.0, 49.0, 56.0, 38.0, 53.0, 49.0, 44.0, 44.0, 42.0, 40.0, 39.0, 29.0, 29.0, 24.0, 30.0, 19.0, 17.0, 12.0, 12.0, 7.0, 10.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.23046875, -2.157379150390625, -2.08428955078125, -2.011199951171875, -1.9381103515625, -1.865020751953125, -1.79193115234375, -1.718841552734375, -1.645751953125, -1.572662353515625, -1.49957275390625, -1.426483154296875, -1.3533935546875, -1.280303955078125, -1.20721435546875, -1.134124755859375, -1.06103515625, -0.987945556640625, -0.91485595703125, -0.841766357421875, -0.7686767578125, -0.695587158203125, -0.62249755859375, -0.549407958984375, -0.476318359375, -0.403228759765625, -0.33013916015625, -0.257049560546875, -0.1839599609375, -0.110870361328125, -0.03778076171875, 0.035308837890625, 0.1083984375, 0.181488037109375, 0.25457763671875, 0.327667236328125, 0.4007568359375, 0.473846435546875, 0.54693603515625, 0.620025634765625, 0.693115234375, 0.766204833984375, 0.83929443359375, 0.912384033203125, 0.9854736328125, 1.058563232421875, 1.13165283203125, 1.204742431640625, 1.27783203125, 1.350921630859375, 1.42401123046875, 1.497100830078125, 1.5701904296875, 1.643280029296875, 1.71636962890625, 1.789459228515625, 1.862548828125, 1.935638427734375, 2.00872802734375, 2.081817626953125, 2.1549072265625, 2.227996826171875, 2.30108642578125, 2.374176025390625, 2.447265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 10.0, 10.0, 8.0, 23.0, 33.0, 49.0, 76.0, 122.0, 214.0, 362.0, 608.0, 1239.0, 2830.0, 7202.0, 21154.0, 75416.0, 347314.0, 2280736.0, 1199859.0, 188520.0, 45679.0, 13686.0, 4922.0, 2005.0, 984.0, 500.0, 266.0, 165.0, 104.0, 57.0, 40.0, 27.0, 22.0, 7.0, 9.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.56640625, -3.44677734375, -3.3271484375, -3.20751953125, -3.087890625, -2.96826171875, -2.8486328125, -2.72900390625, -2.609375, -2.48974609375, -2.3701171875, -2.25048828125, -2.130859375, -2.01123046875, -1.8916015625, -1.77197265625, -1.65234375, -1.53271484375, -1.4130859375, -1.29345703125, -1.173828125, -1.05419921875, -0.9345703125, -0.81494140625, -0.6953125, -0.57568359375, -0.4560546875, -0.33642578125, -0.216796875, -0.09716796875, 0.0224609375, 0.14208984375, 0.26171875, 0.38134765625, 0.5009765625, 0.62060546875, 0.740234375, 0.85986328125, 0.9794921875, 1.09912109375, 1.21875, 1.33837890625, 1.4580078125, 1.57763671875, 1.697265625, 1.81689453125, 1.9365234375, 2.05615234375, 2.17578125, 2.29541015625, 2.4150390625, 2.53466796875, 2.654296875, 2.77392578125, 2.8935546875, 3.01318359375, 3.1328125, 3.25244140625, 3.3720703125, 3.49169921875, 3.611328125, 3.73095703125, 3.8505859375, 3.97021484375, 4.08984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 5.0, 13.0, 11.0, 26.0, 22.0, 43.0, 47.0, 47.0, 96.0, 141.0, 225.0, 386.0, 633.0, 790.0, 569.0, 354.0, 206.0, 155.0, 96.0, 58.0, 32.0, 29.0, 25.0, 14.0, 13.0, 9.0, 12.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.07171630859375, -3.9285888671875, -3.78546142578125, -3.642333984375, -3.49920654296875, -3.3560791015625, -3.21295166015625, -3.06982421875, -2.92669677734375, -2.7835693359375, -2.64044189453125, -2.497314453125, -2.35418701171875, -2.2110595703125, -2.06793212890625, -1.9248046875, -1.78167724609375, -1.6385498046875, -1.49542236328125, -1.352294921875, -1.20916748046875, -1.0660400390625, -0.92291259765625, -0.77978515625, -0.63665771484375, -0.4935302734375, -0.35040283203125, -0.207275390625, -0.06414794921875, 0.0789794921875, 0.22210693359375, 0.365234375, 0.50836181640625, 0.6514892578125, 0.79461669921875, 0.937744140625, 1.08087158203125, 1.2239990234375, 1.36712646484375, 1.51025390625, 1.65338134765625, 1.7965087890625, 1.93963623046875, 2.082763671875, 2.22589111328125, 2.3690185546875, 2.51214599609375, 2.6552734375, 2.79840087890625, 2.9415283203125, 3.08465576171875, 3.227783203125, 3.37091064453125, 3.5140380859375, 3.65716552734375, 3.80029296875, 3.94342041015625, 4.0865478515625, 4.22967529296875, 4.372802734375, 4.51593017578125, 4.6590576171875, 4.80218505859375, 4.9453125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 32.0, 60.0, 166.0, 225.0, 250.0, 151.0, 66.0, 26.0, 10.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.8653564453125, -54.594322204589844, -53.32328796386719, -52.0522575378418, -50.78122329711914, -49.510189056396484, -48.239158630371094, -46.96812438964844, -45.69709014892578, -44.426055908203125, -43.15502166748047, -41.88399124145508, -40.61295700073242, -39.341922760009766, -38.070892333984375, -36.79985809326172, -35.52882385253906, -34.257789611816406, -32.98675537109375, -31.71572494506836, -30.444690704345703, -29.173656463623047, -27.902624130249023, -26.631591796875, -25.360557556152344, -24.089523315429688, -22.818490982055664, -21.54745864868164, -20.276424407958984, -19.005390167236328, -17.734357833862305, -16.46332550048828, -15.192291259765625, -13.921257972717285, -12.650224685668945, -11.379191398620605, -10.108158111572266, -8.837124824523926, -7.566091537475586, -6.295058250427246, -5.024024963378906, -3.7529916763305664, -2.4819583892822266, -1.2109251022338867, 0.060108184814453125, 1.331141471862793, 2.602174758911133, 3.8732080459594727, 5.1442413330078125, 6.415274620056152, 7.686307907104492, 8.957341194152832, 10.228374481201172, 11.499407768249512, 12.770441055297852, 14.041474342346191, 15.312507629394531, 16.583541870117188, 17.85457420349121, 19.125606536865234, 20.39664077758789, 21.667675018310547, 22.93870735168457, 24.209739685058594, 25.48077392578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 18.0, 11.0, 9.0, 12.0, 12.0, 19.0, 16.0, 16.0, 21.0, 17.0, 26.0, 34.0, 32.0, 35.0, 37.0, 33.0, 40.0, 40.0, 41.0, 32.0, 40.0, 39.0, 33.0, 33.0, 31.0, 35.0, 35.0, 26.0, 20.0, 21.0, 26.0, 30.0, 17.0, 16.0, 11.0, 11.0, 13.0, 11.0, 6.0, 6.0, 6.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.014322280883789, -9.704379081726074, -9.39443588256836, -9.084493637084961, -8.774550437927246, -8.464607238769531, -8.154664039611816, -7.844720840454102, -7.534777641296387, -7.224834442138672, -6.914891719818115, -6.6049485206604, -6.2950053215026855, -5.985062599182129, -5.675119400024414, -5.365176200866699, -5.055233478546143, -4.745290279388428, -4.435347557067871, -4.125404357910156, -3.8154611587524414, -3.5055181980133057, -3.19557523727417, -2.885632038116455, -2.5756890773773193, -2.2657461166381836, -1.9558029174804688, -1.645859956741333, -1.3359168767929077, -1.0259737968444824, -0.7160308361053467, -0.40608763694763184, -0.0961446762084961, 0.2137983739376068, 0.5237414240837097, 0.8336844444274902, 1.1436275243759155, 1.4535706043243408, 1.7635135650634766, 2.0734567642211914, 2.383399724960327, 2.693342685699463, 3.0032858848571777, 3.3132288455963135, 3.623171806335449, 3.933115005493164, 4.243058204650879, 4.553001403808594, 4.86294412612915, 5.172887325286865, 5.482830047607422, 5.792773246765137, 6.102716445922852, 6.412659645080566, 6.722602367401123, 7.032545566558838, 7.3424882888793945, 7.652431488037109, 7.962374210357666, 8.272317886352539, 8.582260131835938, 8.892203330993652, 9.202146530151367, 9.512089729309082, 9.822032928466797]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 3.0, 10.0, 14.0, 9.0, 23.0, 30.0, 47.0, 71.0, 99.0, 211.0, 365.0, 599.0, 1225.0, 2607.0, 5247.0, 11296.0, 27321.0, 89113.0, 300838.0, 393388.0, 145824.0, 41225.0, 15106.0, 6833.0, 3376.0, 1672.0, 895.0, 476.0, 245.0, 154.0, 80.0, 51.0, 36.0, 17.0, 19.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.712890625, -3.593841552734375, -3.47479248046875, -3.355743408203125, -3.2366943359375, -3.117645263671875, -2.99859619140625, -2.879547119140625, -2.760498046875, -2.641448974609375, -2.52239990234375, -2.403350830078125, -2.2843017578125, -2.165252685546875, -2.04620361328125, -1.927154541015625, -1.80810546875, -1.689056396484375, -1.57000732421875, -1.450958251953125, -1.3319091796875, -1.212860107421875, -1.09381103515625, -0.974761962890625, -0.855712890625, -0.736663818359375, -0.61761474609375, -0.498565673828125, -0.3795166015625, -0.260467529296875, -0.14141845703125, -0.022369384765625, 0.0966796875, 0.215728759765625, 0.33477783203125, 0.453826904296875, 0.5728759765625, 0.691925048828125, 0.81097412109375, 0.930023193359375, 1.049072265625, 1.168121337890625, 1.28717041015625, 1.406219482421875, 1.5252685546875, 1.644317626953125, 1.76336669921875, 1.882415771484375, 2.00146484375, 2.120513916015625, 2.23956298828125, 2.358612060546875, 2.4776611328125, 2.596710205078125, 2.71575927734375, 2.834808349609375, 2.953857421875, 3.072906494140625, 3.19195556640625, 3.311004638671875, 3.4300537109375, 3.549102783203125, 3.66815185546875, 3.787200927734375, 3.90625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 7.0, 3.0, 8.0, 8.0, 15.0, 16.0, 17.0, 21.0, 27.0, 33.0, 36.0, 48.0, 35.0, 38.0, 57.0, 48.0, 58.0, 51.0, 48.0, 48.0, 45.0, 51.0, 50.0, 36.0, 34.0, 29.0, 18.0, 16.0, 15.0, 19.0, 9.0, 11.0, 8.0, 11.0, 7.0, 8.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.6155242919921875, -1.544525146484375, -1.4735260009765625, -1.40252685546875, -1.3315277099609375, -1.260528564453125, -1.1895294189453125, -1.1185302734375, -1.0475311279296875, -0.976531982421875, -0.9055328369140625, -0.83453369140625, -0.7635345458984375, -0.692535400390625, -0.6215362548828125, -0.550537109375, -0.4795379638671875, -0.408538818359375, -0.3375396728515625, -0.26654052734375, -0.1955413818359375, -0.124542236328125, -0.0535430908203125, 0.0174560546875, 0.0884552001953125, 0.159454345703125, 0.2304534912109375, 0.30145263671875, 0.3724517822265625, 0.443450927734375, 0.5144500732421875, 0.58544921875, 0.6564483642578125, 0.727447509765625, 0.7984466552734375, 0.86944580078125, 0.9404449462890625, 1.011444091796875, 1.0824432373046875, 1.1534423828125, 1.2244415283203125, 1.295440673828125, 1.3664398193359375, 1.43743896484375, 1.5084381103515625, 1.579437255859375, 1.6504364013671875, 1.721435546875, 1.7924346923828125, 1.863433837890625, 1.9344329833984375, 2.00543212890625, 2.0764312744140625, 2.147430419921875, 2.2184295654296875, 2.2894287109375, 2.3604278564453125, 2.431427001953125, 2.5024261474609375, 2.57342529296875, 2.6444244384765625, 2.715423583984375, 2.7864227294921875, 2.857421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 4.0, 12.0, 11.0, 15.0, 19.0, 38.0, 43.0, 61.0, 63.0, 117.0, 221.0, 325.0, 616.0, 1014.0, 1971.0, 3408.0, 6317.0, 12293.0, 25411.0, 57903.0, 149352.0, 311297.0, 272042.0, 116766.0, 45777.0, 20757.0, 10479.0, 5372.0, 2941.0, 1502.0, 935.0, 523.0, 308.0, 203.0, 126.0, 88.0, 53.0, 49.0, 29.0, 20.0, 16.0, 17.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73828125, -2.6466064453125, -2.554931640625, -2.4632568359375, -2.37158203125, -2.2799072265625, -2.188232421875, -2.0965576171875, -2.0048828125, -1.9132080078125, -1.821533203125, -1.7298583984375, -1.63818359375, -1.5465087890625, -1.454833984375, -1.3631591796875, -1.271484375, -1.1798095703125, -1.088134765625, -0.9964599609375, -0.90478515625, -0.8131103515625, -0.721435546875, -0.6297607421875, -0.5380859375, -0.4464111328125, -0.354736328125, -0.2630615234375, -0.17138671875, -0.0797119140625, 0.011962890625, 0.1036376953125, 0.1953125, 0.2869873046875, 0.378662109375, 0.4703369140625, 0.56201171875, 0.6536865234375, 0.745361328125, 0.8370361328125, 0.9287109375, 1.0203857421875, 1.112060546875, 1.2037353515625, 1.29541015625, 1.3870849609375, 1.478759765625, 1.5704345703125, 1.662109375, 1.7537841796875, 1.845458984375, 1.9371337890625, 2.02880859375, 2.1204833984375, 2.212158203125, 2.3038330078125, 2.3955078125, 2.4871826171875, 2.578857421875, 2.6705322265625, 2.76220703125, 2.8538818359375, 2.945556640625, 3.0372314453125, 3.12890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 2.0, 7.0, 9.0, 8.0, 12.0, 13.0, 21.0, 13.0, 23.0, 23.0, 25.0, 31.0, 32.0, 38.0, 40.0, 51.0, 59.0, 37.0, 51.0, 50.0, 40.0, 40.0, 50.0, 37.0, 36.0, 36.0, 25.0, 22.0, 18.0, 29.0, 20.0, 18.0, 17.0, 10.0, 5.0, 5.0, 4.0, 6.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-6.48046875, -6.26605224609375, -6.0516357421875, -5.83721923828125, -5.622802734375, -5.40838623046875, -5.1939697265625, -4.97955322265625, -4.76513671875, -4.55072021484375, -4.3363037109375, -4.12188720703125, -3.907470703125, -3.69305419921875, -3.4786376953125, -3.26422119140625, -3.0498046875, -2.83538818359375, -2.6209716796875, -2.40655517578125, -2.192138671875, -1.97772216796875, -1.7633056640625, -1.54888916015625, -1.33447265625, -1.12005615234375, -0.9056396484375, -0.69122314453125, -0.476806640625, -0.26239013671875, -0.0479736328125, 0.16644287109375, 0.380859375, 0.59527587890625, 0.8096923828125, 1.02410888671875, 1.238525390625, 1.45294189453125, 1.6673583984375, 1.88177490234375, 2.09619140625, 2.31060791015625, 2.5250244140625, 2.73944091796875, 2.953857421875, 3.16827392578125, 3.3826904296875, 3.59710693359375, 3.8115234375, 4.02593994140625, 4.2403564453125, 4.45477294921875, 4.669189453125, 4.88360595703125, 5.0980224609375, 5.31243896484375, 5.52685546875, 5.74127197265625, 5.9556884765625, 6.17010498046875, 6.384521484375, 6.59893798828125, 6.8133544921875, 7.02777099609375, 7.2421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 5.0, 14.0, 27.0, 39.0, 61.0, 86.0, 134.0, 194.0, 317.0, 486.0, 784.0, 1273.0, 2142.0, 3486.0, 5674.0, 10381.0, 20005.0, 46476.0, 119441.0, 282416.0, 310863.0, 139543.0, 53877.0, 23150.0, 11544.0, 6402.0, 3747.0, 2305.0, 1365.0, 863.0, 515.0, 312.0, 223.0, 136.0, 111.0, 57.0, 42.0, 25.0, 11.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.034454345703125, -0.99761962890625, -0.960784912109375, -0.9239501953125, -0.887115478515625, -0.85028076171875, -0.813446044921875, -0.776611328125, -0.739776611328125, -0.70294189453125, -0.666107177734375, -0.6292724609375, -0.592437744140625, -0.55560302734375, -0.518768310546875, -0.48193359375, -0.445098876953125, -0.40826416015625, -0.371429443359375, -0.3345947265625, -0.297760009765625, -0.26092529296875, -0.224090576171875, -0.187255859375, -0.150421142578125, -0.11358642578125, -0.076751708984375, -0.0399169921875, -0.003082275390625, 0.03375244140625, 0.070587158203125, 0.107421875, 0.144256591796875, 0.18109130859375, 0.217926025390625, 0.2547607421875, 0.291595458984375, 0.32843017578125, 0.365264892578125, 0.402099609375, 0.438934326171875, 0.47576904296875, 0.512603759765625, 0.5494384765625, 0.586273193359375, 0.62310791015625, 0.659942626953125, 0.69677734375, 0.733612060546875, 0.77044677734375, 0.807281494140625, 0.8441162109375, 0.880950927734375, 0.91778564453125, 0.954620361328125, 0.991455078125, 1.028289794921875, 1.06512451171875, 1.101959228515625, 1.1387939453125, 1.175628662109375, 1.21246337890625, 1.249298095703125, 1.2861328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 14.0, 9.0, 16.0, 32.0, 54.0, 72.0, 128.0, 183.0, 147.0, 104.0, 54.0, 59.0, 37.0, 21.0, 13.0, 9.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006761550903320312, -0.0006555542349815369, -0.0006349533796310425, -0.0006143525242805481, -0.0005937516689300537, -0.0005731508135795593, -0.0005525499582290649, -0.0005319491028785706, -0.0005113482475280762, -0.0004907473921775818, -0.0004701465368270874, -0.000449545681476593, -0.00042894482612609863, -0.00040834397077560425, -0.00038774311542510986, -0.0003671422600746155, -0.0003465414047241211, -0.0003259405493736267, -0.0003053396940231323, -0.00028473883867263794, -0.00026413798332214355, -0.00024353712797164917, -0.00022293627262115479, -0.0002023354172706604, -0.00018173456192016602, -0.00016113370656967163, -0.00014053285121917725, -0.00011993199586868286, -9.933114051818848e-05, -7.873028516769409e-05, -5.812942981719971e-05, -3.752857446670532e-05, -1.6927719116210938e-05, 3.6731362342834473e-06, 2.4273991584777832e-05, 4.487484693527222e-05, 6.54757022857666e-05, 8.607655763626099e-05, 0.00010667741298675537, 0.00012727826833724976, 0.00014787912368774414, 0.00016847997903823853, 0.0001890808343887329, 0.0002096816897392273, 0.00023028254508972168, 0.00025088340044021606, 0.00027148425579071045, 0.00029208511114120483, 0.0003126859664916992, 0.0003332868218421936, 0.000353887677192688, 0.0003744885325431824, 0.00039508938789367676, 0.00041569024324417114, 0.00043629109859466553, 0.0004568919539451599, 0.0004774928092956543, 0.0004980936646461487, 0.0005186945199966431, 0.0005392953753471375, 0.0005598962306976318, 0.0005804970860481262, 0.0006010979413986206, 0.000621698796749115, 0.0006422996520996094]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 7.0, 15.0, 21.0, 27.0, 43.0, 71.0, 100.0, 157.0, 242.0, 399.0, 676.0, 1195.0, 2051.0, 3620.0, 6650.0, 13219.0, 27648.0, 59486.0, 129740.0, 234820.0, 259966.0, 161617.0, 76939.0, 34703.0, 16552.0, 8218.0, 4413.0, 2407.0, 1424.0, 777.0, 503.0, 293.0, 192.0, 113.0, 69.0, 62.0, 30.0, 18.0, 20.0, 11.0, 8.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9716720581054688, -0.9423675537109375, -0.9130630493164062, -0.883758544921875, -0.8544540405273438, -0.8251495361328125, -0.7958450317382812, -0.76654052734375, -0.7372360229492188, -0.7079315185546875, -0.6786270141601562, -0.649322509765625, -0.6200180053710938, -0.5907135009765625, -0.5614089965820312, -0.5321044921875, -0.5027999877929688, -0.4734954833984375, -0.44419097900390625, -0.414886474609375, -0.38558197021484375, -0.3562774658203125, -0.32697296142578125, -0.29766845703125, -0.26836395263671875, -0.2390594482421875, -0.20975494384765625, -0.180450439453125, -0.15114593505859375, -0.1218414306640625, -0.09253692626953125, -0.063232421875, -0.03392791748046875, -0.0046234130859375, 0.02468109130859375, 0.053985595703125, 0.08329010009765625, 0.1125946044921875, 0.14189910888671875, 0.17120361328125, 0.20050811767578125, 0.2298126220703125, 0.25911712646484375, 0.288421630859375, 0.31772613525390625, 0.3470306396484375, 0.37633514404296875, 0.4056396484375, 0.43494415283203125, 0.4642486572265625, 0.49355316162109375, 0.522857666015625, 0.5521621704101562, 0.5814666748046875, 0.6107711791992188, 0.64007568359375, 0.6693801879882812, 0.6986846923828125, 0.7279891967773438, 0.757293701171875, 0.7865982055664062, 0.8159027099609375, 0.8452072143554688, 0.87451171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 9.0, 3.0, 16.0, 8.0, 14.0, 17.0, 30.0, 34.0, 39.0, 42.0, 56.0, 42.0, 65.0, 63.0, 59.0, 70.0, 62.0, 56.0, 54.0, 42.0, 29.0, 39.0, 19.0, 19.0, 19.0, 13.0, 13.0, 5.0, 2.0, 6.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.166015625, -1.1263580322265625, -1.086700439453125, -1.0470428466796875, -1.00738525390625, -0.9677276611328125, -0.928070068359375, -0.8884124755859375, -0.8487548828125, -0.8090972900390625, -0.769439697265625, -0.7297821044921875, -0.69012451171875, -0.6504669189453125, -0.610809326171875, -0.5711517333984375, -0.531494140625, -0.4918365478515625, -0.452178955078125, -0.4125213623046875, -0.37286376953125, -0.3332061767578125, -0.293548583984375, -0.2538909912109375, -0.2142333984375, -0.1745758056640625, -0.134918212890625, -0.0952606201171875, -0.05560302734375, -0.0159454345703125, 0.023712158203125, 0.0633697509765625, 0.10302734375, 0.1426849365234375, 0.182342529296875, 0.2220001220703125, 0.26165771484375, 0.3013153076171875, 0.340972900390625, 0.3806304931640625, 0.4202880859375, 0.4599456787109375, 0.499603271484375, 0.5392608642578125, 0.57891845703125, 0.6185760498046875, 0.658233642578125, 0.6978912353515625, 0.737548828125, 0.7772064208984375, 0.816864013671875, 0.8565216064453125, 0.89617919921875, 0.9358367919921875, 0.975494384765625, 1.0151519775390625, 1.0548095703125, 1.0944671630859375, 1.134124755859375, 1.1737823486328125, 1.21343994140625, 1.2530975341796875, 1.292755126953125, 1.3324127197265625, 1.3720703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 9.0, 14.0, 23.0, 44.0, 61.0, 102.0, 124.0, 156.0, 149.0, 98.0, 85.0, 48.0, 26.0, 18.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140583038330078, -16.473159790039062, -15.80573558807373, -15.138311386108398, -14.470888137817383, -13.803464889526367, -13.136040687561035, -12.468616485595703, -11.801193237304688, -11.133769989013672, -10.46634578704834, -9.798921585083008, -9.131498336791992, -8.464075088500977, -7.7966508865356445, -7.129227161407471, -6.461803436279297, -5.794379711151123, -5.126955986022949, -4.459532260894775, -3.7921085357666016, -3.1246848106384277, -2.457261085510254, -1.78983736038208, -1.1224136352539062, -0.4549899101257324, 0.2124338150024414, 0.8798575401306152, 1.547281265258789, 2.214704990386963, 2.8821287155151367, 3.5495524406433105, 4.216974258422852, 4.884397983551025, 5.551821708679199, 6.219245433807373, 6.886669158935547, 7.554092884063721, 8.221516609191895, 8.888940811157227, 9.556364059448242, 10.223787307739258, 10.89121150970459, 11.558635711669922, 12.226058959960938, 12.893482208251953, 13.560906410217285, 14.228330612182617, 14.895753860473633, 15.563177108764648, 16.230602264404297, 16.898025512695312, 17.565448760986328, 18.232872009277344, 18.90029525756836, 19.567720413208008, 20.235143661499023, 20.90256690979004, 21.569992065429688, 22.237415313720703, 22.90483856201172, 23.572261810302734, 24.23968505859375, 24.9071102142334, 25.574533462524414]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 1.0, 3.0, 4.0, 5.0, 8.0, 4.0, 10.0, 8.0, 6.0, 16.0, 22.0, 19.0, 31.0, 23.0, 26.0, 28.0, 32.0, 28.0, 34.0, 36.0, 43.0, 39.0, 40.0, 25.0, 41.0, 42.0, 38.0, 43.0, 40.0, 26.0, 34.0, 32.0, 35.0, 28.0, 30.0, 20.0, 19.0, 23.0, 14.0, 11.0, 8.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.676050186157227, -14.19009780883789, -13.704145431518555, -13.218193054199219, -12.732240676879883, -12.246288299560547, -11.760335922241211, -11.274383544921875, -10.788431167602539, -10.302478790283203, -9.816526412963867, -9.330574035644531, -8.844621658325195, -8.35866928100586, -7.872716903686523, -7.3867645263671875, -6.900811672210693, -6.414859294891357, -5.9289069175720215, -5.4429545402526855, -4.95700216293335, -4.4710493087768555, -3.9850971698760986, -3.4991447925567627, -3.0131924152374268, -2.527240037918091, -2.041287660598755, -1.5553351640701294, -1.0693827867507935, -0.583430290222168, -0.09747791290283203, 0.3884744644165039, 0.8744268417358398, 1.3603792190551758, 1.8463315963745117, 2.3322839736938477, 2.8182363510131836, 3.3041889667510986, 3.7901413440704346, 4.276093482971191, 4.762045860290527, 5.247998237609863, 5.733950614929199, 6.219902992248535, 6.705855369567871, 7.191807746887207, 7.677760124206543, 8.163712501525879, 8.649665832519531, 9.135618209838867, 9.621570587158203, 10.107522964477539, 10.593475341796875, 11.079427719116211, 11.565380096435547, 12.051332473754883, 12.537284851074219, 13.023237228393555, 13.50918960571289, 13.995141983032227, 14.481094360351562, 14.967046737670898, 15.452999114990234, 15.93895149230957, 16.424903869628906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 10.0, 9.0, 18.0, 20.0, 25.0, 42.0, 59.0, 106.0, 160.0, 268.0, 421.0, 673.0, 1222.0, 2182.0, 3908.0, 7873.0, 15596.0, 33879.0, 79159.0, 193539.0, 467762.0, 960540.0, 1181459.0, 715037.0, 309408.0, 123302.0, 51089.0, 22632.0, 10950.0, 5566.0, 2926.0, 1725.0, 947.0, 616.0, 389.0, 225.0, 163.0, 114.0, 62.0, 60.0, 36.0, 23.0, 26.0, 16.0, 8.0, 9.0, 7.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4501953125, -1.3949737548828125, -1.339752197265625, -1.2845306396484375, -1.22930908203125, -1.1740875244140625, -1.118865966796875, -1.0636444091796875, -1.0084228515625, -0.9532012939453125, -0.897979736328125, -0.8427581787109375, -0.78753662109375, -0.7323150634765625, -0.677093505859375, -0.6218719482421875, -0.566650390625, -0.5114288330078125, -0.456207275390625, -0.4009857177734375, -0.34576416015625, -0.2905426025390625, -0.235321044921875, -0.1800994873046875, -0.1248779296875, -0.0696563720703125, -0.014434814453125, 0.0407867431640625, 0.09600830078125, 0.1512298583984375, 0.206451416015625, 0.2616729736328125, 0.31689453125, 0.3721160888671875, 0.427337646484375, 0.4825592041015625, 0.53778076171875, 0.5930023193359375, 0.648223876953125, 0.7034454345703125, 0.7586669921875, 0.8138885498046875, 0.869110107421875, 0.9243316650390625, 0.97955322265625, 1.0347747802734375, 1.089996337890625, 1.1452178955078125, 1.200439453125, 1.2556610107421875, 1.310882568359375, 1.3661041259765625, 1.42132568359375, 1.4765472412109375, 1.531768798828125, 1.5869903564453125, 1.6422119140625, 1.6974334716796875, 1.752655029296875, 1.8078765869140625, 1.86309814453125, 1.9183197021484375, 1.973541259765625, 2.0287628173828125, 2.083984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 10.0, 10.0, 7.0, 14.0, 16.0, 17.0, 28.0, 28.0, 27.0, 27.0, 47.0, 33.0, 51.0, 41.0, 50.0, 44.0, 56.0, 49.0, 39.0, 42.0, 41.0, 44.0, 36.0, 34.0, 29.0, 28.0, 19.0, 26.0, 19.0, 16.0, 14.0, 12.0, 8.0, 5.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.230224609375, -2.15771484375, -2.085205078125, -2.0126953125, -1.940185546875, -1.86767578125, -1.795166015625, -1.72265625, -1.650146484375, -1.57763671875, -1.505126953125, -1.4326171875, -1.360107421875, -1.28759765625, -1.215087890625, -1.142578125, -1.070068359375, -0.99755859375, -0.925048828125, -0.8525390625, -0.780029296875, -0.70751953125, -0.635009765625, -0.5625, -0.489990234375, -0.41748046875, -0.344970703125, -0.2724609375, -0.199951171875, -0.12744140625, -0.054931640625, 0.017578125, 0.090087890625, 0.16259765625, 0.235107421875, 0.3076171875, 0.380126953125, 0.45263671875, 0.525146484375, 0.59765625, 0.670166015625, 0.74267578125, 0.815185546875, 0.8876953125, 0.960205078125, 1.03271484375, 1.105224609375, 1.177734375, 1.250244140625, 1.32275390625, 1.395263671875, 1.4677734375, 1.540283203125, 1.61279296875, 1.685302734375, 1.7578125, 1.830322265625, 1.90283203125, 1.975341796875, 2.0478515625, 2.120361328125, 2.19287109375, 2.265380859375, 2.337890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 7.0, 17.0, 15.0, 31.0, 35.0, 39.0, 71.0, 116.0, 144.0, 254.0, 401.0, 634.0, 1205.0, 2285.0, 4702.0, 10487.0, 26513.0, 74996.0, 244695.0, 1015922.0, 1997200.0, 575616.0, 154650.0, 50058.0, 18545.0, 7740.0, 3573.0, 1802.0, 998.0, 558.0, 322.0, 222.0, 129.0, 82.0, 54.0, 36.0, 26.0, 24.0, 14.0, 11.0, 13.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-3.130859375, -3.03961181640625, -2.9483642578125, -2.85711669921875, -2.765869140625, -2.67462158203125, -2.5833740234375, -2.49212646484375, -2.40087890625, -2.30963134765625, -2.2183837890625, -2.12713623046875, -2.035888671875, -1.94464111328125, -1.8533935546875, -1.76214599609375, -1.6708984375, -1.57965087890625, -1.4884033203125, -1.39715576171875, -1.305908203125, -1.21466064453125, -1.1234130859375, -1.03216552734375, -0.94091796875, -0.84967041015625, -0.7584228515625, -0.66717529296875, -0.575927734375, -0.48468017578125, -0.3934326171875, -0.30218505859375, -0.2109375, -0.11968994140625, -0.0284423828125, 0.06280517578125, 0.154052734375, 0.24530029296875, 0.3365478515625, 0.42779541015625, 0.51904296875, 0.61029052734375, 0.7015380859375, 0.79278564453125, 0.884033203125, 0.97528076171875, 1.0665283203125, 1.15777587890625, 1.2490234375, 1.34027099609375, 1.4315185546875, 1.52276611328125, 1.614013671875, 1.70526123046875, 1.7965087890625, 1.88775634765625, 1.97900390625, 2.07025146484375, 2.1614990234375, 2.25274658203125, 2.343994140625, 2.43524169921875, 2.5264892578125, 2.61773681640625, 2.708984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 19.0, 22.0, 25.0, 35.0, 30.0, 43.0, 69.0, 102.0, 162.0, 189.0, 299.0, 390.0, 530.0, 559.0, 454.0, 308.0, 245.0, 158.0, 109.0, 54.0, 56.0, 53.0, 26.0, 29.0, 13.0, 21.0, 14.0, 4.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6953125, -3.57666015625, -3.4580078125, -3.33935546875, -3.220703125, -3.10205078125, -2.9833984375, -2.86474609375, -2.74609375, -2.62744140625, -2.5087890625, -2.39013671875, -2.271484375, -2.15283203125, -2.0341796875, -1.91552734375, -1.796875, -1.67822265625, -1.5595703125, -1.44091796875, -1.322265625, -1.20361328125, -1.0849609375, -0.96630859375, -0.84765625, -0.72900390625, -0.6103515625, -0.49169921875, -0.373046875, -0.25439453125, -0.1357421875, -0.01708984375, 0.1015625, 0.22021484375, 0.3388671875, 0.45751953125, 0.576171875, 0.69482421875, 0.8134765625, 0.93212890625, 1.05078125, 1.16943359375, 1.2880859375, 1.40673828125, 1.525390625, 1.64404296875, 1.7626953125, 1.88134765625, 2.0, 2.11865234375, 2.2373046875, 2.35595703125, 2.474609375, 2.59326171875, 2.7119140625, 2.83056640625, 2.94921875, 3.06787109375, 3.1865234375, 3.30517578125, 3.423828125, 3.54248046875, 3.6611328125, 3.77978515625, 3.8984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 31.0, 119.0, 229.0, 303.0, 199.0, 73.0, 24.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.60888671875, -66.94815063476562, -65.28742218017578, -63.626686096191406, -61.96595001220703, -60.30521774291992, -58.64448547363281, -56.98374938964844, -55.32301330566406, -53.66228103637695, -52.00154495239258, -50.34081268310547, -48.680076599121094, -47.019344329833984, -45.358612060546875, -43.6978759765625, -42.03714370727539, -40.37641143798828, -38.715675354003906, -37.0549430847168, -35.39420700073242, -33.73347473144531, -32.07273864746094, -30.412006378173828, -28.751272201538086, -27.090538024902344, -25.4298038482666, -23.76906967163086, -22.10833740234375, -20.447601318359375, -18.786869049072266, -17.126134872436523, -15.465404510498047, -13.804670333862305, -12.143936157226562, -10.483202934265137, -8.822468757629395, -7.161734580993652, -5.501001358032227, -3.8402671813964844, -2.179533004760742, -0.5187990665435791, 1.141934871673584, 2.802668571472168, 4.46340274810791, 6.124136924743652, 7.784870147705078, 9.44560432434082, 11.106338500976562, 12.767072677612305, 14.427806854248047, 16.088539123535156, 17.74927520751953, 19.41000747680664, 21.070741653442383, 22.731475830078125, 24.392210006713867, 26.05294418334961, 27.71367835998535, 29.374412536621094, 31.035144805908203, 32.69588088989258, 34.35661315917969, 36.01734924316406, 37.67808151245117]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 13.0, 17.0, 17.0, 23.0, 17.0, 27.0, 25.0, 30.0, 39.0, 32.0, 61.0, 45.0, 38.0, 41.0, 39.0, 49.0, 57.0, 49.0, 47.0, 38.0, 34.0, 43.0, 25.0, 28.0, 40.0, 21.0, 14.0, 13.0, 6.0, 9.0, 10.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.223922729492188, -14.78917407989502, -14.354426383972168, -13.919677734375, -13.484930038452148, -13.05018138885498, -12.615432739257812, -12.180685043334961, -11.74593734741211, -11.311188697814941, -10.87644100189209, -10.441692352294922, -10.00694465637207, -9.572196006774902, -9.137447357177734, -8.702699661254883, -8.267951011657715, -7.833202838897705, -7.398454666137695, -6.963706016540527, -6.528958320617676, -6.094209671020508, -5.659461498260498, -5.224713325500488, -4.7899651527404785, -4.355216979980469, -3.920468807220459, -3.48572039604187, -3.0509722232818604, -2.6162240505218506, -2.1814756393432617, -1.746727466583252, -1.3119792938232422, -0.8772310614585876, -0.4424828290939331, -0.007734537124633789, 0.427013635635376, 0.8617618083953857, 1.2965102195739746, 1.7312583923339844, 2.166006565093994, 2.600754737854004, 3.0355029106140137, 3.4702513217926025, 3.9049994945526123, 4.339747428894043, 4.774496078491211, 5.209244251251221, 5.6439924240112305, 6.07874059677124, 6.51348876953125, 6.948237419128418, 7.3829851150512695, 7.8177337646484375, 8.252481460571289, 8.687230110168457, 9.121978759765625, 9.556727409362793, 9.991475105285645, 10.426223754882812, 10.860971450805664, 11.295720100402832, 11.73046875, 12.165216445922852, 12.599964141845703]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 10.0, 11.0, 22.0, 42.0, 43.0, 94.0, 207.0, 381.0, 693.0, 1352.0, 2537.0, 4841.0, 9356.0, 21045.0, 63905.0, 228765.0, 407995.0, 210596.0, 58439.0, 19435.0, 9038.0, 4554.0, 2450.0, 1254.0, 700.0, 349.0, 182.0, 98.0, 55.0, 36.0, 29.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.9901123046875, -3.859130859375, -3.7281494140625, -3.59716796875, -3.4661865234375, -3.335205078125, -3.2042236328125, -3.0732421875, -2.9422607421875, -2.811279296875, -2.6802978515625, -2.54931640625, -2.4183349609375, -2.287353515625, -2.1563720703125, -2.025390625, -1.8944091796875, -1.763427734375, -1.6324462890625, -1.50146484375, -1.3704833984375, -1.239501953125, -1.1085205078125, -0.9775390625, -0.8465576171875, -0.715576171875, -0.5845947265625, -0.45361328125, -0.3226318359375, -0.191650390625, -0.0606689453125, 0.0703125, 0.2012939453125, 0.332275390625, 0.4632568359375, 0.59423828125, 0.7252197265625, 0.856201171875, 0.9871826171875, 1.1181640625, 1.2491455078125, 1.380126953125, 1.5111083984375, 1.64208984375, 1.7730712890625, 1.904052734375, 2.0350341796875, 2.166015625, 2.2969970703125, 2.427978515625, 2.5589599609375, 2.68994140625, 2.8209228515625, 2.951904296875, 3.0828857421875, 3.2138671875, 3.3448486328125, 3.475830078125, 3.6068115234375, 3.73779296875, 3.8687744140625, 3.999755859375, 4.1307373046875, 4.26171875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 10.0, 14.0, 12.0, 21.0, 31.0, 28.0, 26.0, 29.0, 29.0, 29.0, 32.0, 35.0, 38.0, 49.0, 50.0, 45.0, 47.0, 41.0, 49.0, 29.0, 39.0, 34.0, 32.0, 37.0, 33.0, 24.0, 16.0, 25.0, 24.0, 8.0, 11.0, 10.0, 12.0, 6.0, 8.0, 2.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.105377197265625, -2.03497314453125, -1.964569091796875, -1.8941650390625, -1.823760986328125, -1.75335693359375, -1.682952880859375, -1.612548828125, -1.542144775390625, -1.47174072265625, -1.401336669921875, -1.3309326171875, -1.260528564453125, -1.19012451171875, -1.119720458984375, -1.04931640625, -0.978912353515625, -0.90850830078125, -0.838104248046875, -0.7677001953125, -0.697296142578125, -0.62689208984375, -0.556488037109375, -0.486083984375, -0.415679931640625, -0.34527587890625, -0.274871826171875, -0.2044677734375, -0.134063720703125, -0.06365966796875, 0.006744384765625, 0.0771484375, 0.147552490234375, 0.21795654296875, 0.288360595703125, 0.3587646484375, 0.429168701171875, 0.49957275390625, 0.569976806640625, 0.640380859375, 0.710784912109375, 0.78118896484375, 0.851593017578125, 0.9219970703125, 0.992401123046875, 1.06280517578125, 1.133209228515625, 1.20361328125, 1.274017333984375, 1.34442138671875, 1.414825439453125, 1.4852294921875, 1.555633544921875, 1.62603759765625, 1.696441650390625, 1.766845703125, 1.837249755859375, 1.90765380859375, 1.978057861328125, 2.0484619140625, 2.118865966796875, 2.18927001953125, 2.259674072265625, 2.330078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 14.0, 21.0, 23.0, 42.0, 33.0, 77.0, 92.0, 146.0, 232.0, 356.0, 620.0, 1014.0, 1818.0, 3076.0, 5663.0, 10668.0, 21017.0, 47880.0, 119823.0, 265087.0, 299836.0, 155660.0, 60941.0, 26018.0, 12756.0, 6658.0, 3779.0, 2141.0, 1192.0, 675.0, 430.0, 237.0, 155.0, 108.0, 67.0, 54.0, 33.0, 25.0, 25.0, 11.0, 10.0, 6.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.150390625, -3.055328369140625, -2.96026611328125, -2.865203857421875, -2.7701416015625, -2.675079345703125, -2.58001708984375, -2.484954833984375, -2.389892578125, -2.294830322265625, -2.19976806640625, -2.104705810546875, -2.0096435546875, -1.914581298828125, -1.81951904296875, -1.724456787109375, -1.62939453125, -1.534332275390625, -1.43927001953125, -1.344207763671875, -1.2491455078125, -1.154083251953125, -1.05902099609375, -0.963958740234375, -0.868896484375, -0.773834228515625, -0.67877197265625, -0.583709716796875, -0.4886474609375, -0.393585205078125, -0.29852294921875, -0.203460693359375, -0.1083984375, -0.013336181640625, 0.08172607421875, 0.176788330078125, 0.2718505859375, 0.366912841796875, 0.46197509765625, 0.557037353515625, 0.652099609375, 0.747161865234375, 0.84222412109375, 0.937286376953125, 1.0323486328125, 1.127410888671875, 1.22247314453125, 1.317535400390625, 1.41259765625, 1.507659912109375, 1.60272216796875, 1.697784423828125, 1.7928466796875, 1.887908935546875, 1.98297119140625, 2.078033447265625, 2.173095703125, 2.268157958984375, 2.36322021484375, 2.458282470703125, 2.5533447265625, 2.648406982421875, 2.74346923828125, 2.838531494140625, 2.93359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 3.0, 4.0, 7.0, 8.0, 8.0, 9.0, 9.0, 14.0, 18.0, 12.0, 14.0, 16.0, 31.0, 21.0, 22.0, 25.0, 23.0, 38.0, 31.0, 35.0, 32.0, 38.0, 38.0, 42.0, 35.0, 37.0, 45.0, 34.0, 28.0, 35.0, 30.0, 30.0, 30.0, 17.0, 16.0, 34.0, 15.0, 16.0, 10.0, 9.0, 15.0, 10.0, 8.0, 9.0, 7.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 4.0, 4.0], "bins": [-6.09375, -5.91748046875, -5.7412109375, -5.56494140625, -5.388671875, -5.21240234375, -5.0361328125, -4.85986328125, -4.68359375, -4.50732421875, -4.3310546875, -4.15478515625, -3.978515625, -3.80224609375, -3.6259765625, -3.44970703125, -3.2734375, -3.09716796875, -2.9208984375, -2.74462890625, -2.568359375, -2.39208984375, -2.2158203125, -2.03955078125, -1.86328125, -1.68701171875, -1.5107421875, -1.33447265625, -1.158203125, -0.98193359375, -0.8056640625, -0.62939453125, -0.453125, -0.27685546875, -0.1005859375, 0.07568359375, 0.251953125, 0.42822265625, 0.6044921875, 0.78076171875, 0.95703125, 1.13330078125, 1.3095703125, 1.48583984375, 1.662109375, 1.83837890625, 2.0146484375, 2.19091796875, 2.3671875, 2.54345703125, 2.7197265625, 2.89599609375, 3.072265625, 3.24853515625, 3.4248046875, 3.60107421875, 3.77734375, 3.95361328125, 4.1298828125, 4.30615234375, 4.482421875, 4.65869140625, 4.8349609375, 5.01123046875, 5.1875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 6.0, 10.0, 5.0, 5.0, 10.0, 19.0, 30.0, 36.0, 57.0, 66.0, 100.0, 153.0, 222.0, 284.0, 434.0, 648.0, 989.0, 1558.0, 2592.0, 4118.0, 6990.0, 12902.0, 24570.0, 49570.0, 112856.0, 229507.0, 277342.0, 169370.0, 76723.0, 35485.0, 17837.0, 9621.0, 5572.0, 3185.0, 1900.0, 1247.0, 839.0, 521.0, 369.0, 285.0, 164.0, 108.0, 87.0, 63.0, 26.0, 24.0, 23.0, 14.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.89501953125, -0.8644332885742188, -0.8338470458984375, -0.8032608032226562, -0.772674560546875, -0.7420883178710938, -0.7115020751953125, -0.6809158325195312, -0.65032958984375, -0.6197433471679688, -0.5891571044921875, -0.5585708618164062, -0.527984619140625, -0.49739837646484375, -0.4668121337890625, -0.43622589111328125, -0.4056396484375, -0.37505340576171875, -0.3444671630859375, -0.31388092041015625, -0.283294677734375, -0.25270843505859375, -0.2221221923828125, -0.19153594970703125, -0.16094970703125, -0.13036346435546875, -0.0997772216796875, -0.06919097900390625, -0.038604736328125, -0.00801849365234375, 0.0225677490234375, 0.05315399169921875, 0.083740234375, 0.11432647705078125, 0.1449127197265625, 0.17549896240234375, 0.206085205078125, 0.23667144775390625, 0.2672576904296875, 0.29784393310546875, 0.32843017578125, 0.35901641845703125, 0.3896026611328125, 0.42018890380859375, 0.450775146484375, 0.48136138916015625, 0.5119476318359375, 0.5425338745117188, 0.5731201171875, 0.6037063598632812, 0.6342926025390625, 0.6648788452148438, 0.695465087890625, 0.7260513305664062, 0.7566375732421875, 0.7872238159179688, 0.81781005859375, 0.8483963012695312, 0.8789825439453125, 0.9095687866210938, 0.940155029296875, 0.9707412719726562, 1.0013275146484375, 1.0319137573242188, 1.0625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 3.0, 9.0, 11.0, 15.0, 18.0, 29.0, 51.0, 49.0, 83.0, 102.0, 122.0, 99.0, 103.0, 80.0, 62.0, 38.0, 19.0, 26.0, 10.0, 8.0, 6.0, 9.0, 9.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003757476806640625, -0.0003598928451538086, -0.0003440380096435547, -0.0003281831741333008, -0.0003123283386230469, -0.00029647350311279297, -0.00028061866760253906, -0.00026476383209228516, -0.00024890899658203125, -0.00023305416107177734, -0.00021719932556152344, -0.00020134449005126953, -0.00018548965454101562, -0.00016963481903076172, -0.0001537799835205078, -0.0001379251480102539, -0.0001220703125, -0.0001062154769897461, -9.036064147949219e-05, -7.450580596923828e-05, -5.8650970458984375e-05, -4.279613494873047e-05, -2.6941299438476562e-05, -1.1086463928222656e-05, 4.76837158203125e-06, 2.0623207092285156e-05, 3.647804260253906e-05, 5.233287811279297e-05, 6.818771362304688e-05, 8.404254913330078e-05, 9.989738464355469e-05, 0.0001157522201538086, 0.0001316070556640625, 0.0001474618911743164, 0.0001633167266845703, 0.00017917156219482422, 0.00019502639770507812, 0.00021088123321533203, 0.00022673606872558594, 0.00024259090423583984, 0.00025844573974609375, 0.00027430057525634766, 0.00029015541076660156, 0.00030601024627685547, 0.0003218650817871094, 0.0003377199172973633, 0.0003535747528076172, 0.0003694295883178711, 0.000385284423828125, 0.0004011392593383789, 0.0004169940948486328, 0.0004328489303588867, 0.0004487037658691406, 0.00046455860137939453, 0.00048041343688964844, 0.0004962682723999023, 0.0005121231079101562, 0.0005279779434204102, 0.0005438327789306641, 0.000559687614440918, 0.0005755424499511719, 0.0005913972854614258, 0.0006072521209716797, 0.0006231069564819336, 0.0006389617919921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 10.0, 12.0, 13.0, 32.0, 44.0, 101.0, 159.0, 274.0, 533.0, 1101.0, 2331.0, 5823.0, 15764.0, 49342.0, 158977.0, 356844.0, 296839.0, 108467.0, 33001.0, 11146.0, 4282.0, 1732.0, 846.0, 379.0, 202.0, 105.0, 83.0, 38.0, 21.0, 20.0, 11.0, 2.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5078125, -1.4645233154296875, -1.421234130859375, -1.3779449462890625, -1.33465576171875, -1.2913665771484375, -1.248077392578125, -1.2047882080078125, -1.1614990234375, -1.1182098388671875, -1.074920654296875, -1.0316314697265625, -0.98834228515625, -0.9450531005859375, -0.901763916015625, -0.8584747314453125, -0.815185546875, -0.7718963623046875, -0.728607177734375, -0.6853179931640625, -0.64202880859375, -0.5987396240234375, -0.555450439453125, -0.5121612548828125, -0.4688720703125, -0.4255828857421875, -0.382293701171875, -0.3390045166015625, -0.29571533203125, -0.2524261474609375, -0.209136962890625, -0.1658477783203125, -0.12255859375, -0.0792694091796875, -0.035980224609375, 0.0073089599609375, 0.05059814453125, 0.0938873291015625, 0.137176513671875, 0.1804656982421875, 0.2237548828125, 0.2670440673828125, 0.310333251953125, 0.3536224365234375, 0.39691162109375, 0.4402008056640625, 0.483489990234375, 0.5267791748046875, 0.570068359375, 0.6133575439453125, 0.656646728515625, 0.6999359130859375, 0.74322509765625, 0.7865142822265625, 0.829803466796875, 0.8730926513671875, 0.9163818359375, 0.9596710205078125, 1.002960205078125, 1.0462493896484375, 1.08953857421875, 1.1328277587890625, 1.176116943359375, 1.2194061279296875, 1.2626953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 5.0, 9.0, 6.0, 19.0, 20.0, 19.0, 32.0, 44.0, 34.0, 63.0, 68.0, 72.0, 75.0, 81.0, 60.0, 61.0, 53.0, 56.0, 39.0, 31.0, 33.0, 26.0, 26.0, 21.0, 9.0, 5.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.360076904296875, -1.31195068359375, -1.263824462890625, -1.2156982421875, -1.167572021484375, -1.11944580078125, -1.071319580078125, -1.023193359375, -0.975067138671875, -0.92694091796875, -0.878814697265625, -0.8306884765625, -0.782562255859375, -0.73443603515625, -0.686309814453125, -0.63818359375, -0.590057373046875, -0.54193115234375, -0.493804931640625, -0.4456787109375, -0.397552490234375, -0.34942626953125, -0.301300048828125, -0.253173828125, -0.205047607421875, -0.15692138671875, -0.108795166015625, -0.0606689453125, -0.012542724609375, 0.03558349609375, 0.083709716796875, 0.1318359375, 0.179962158203125, 0.22808837890625, 0.276214599609375, 0.3243408203125, 0.372467041015625, 0.42059326171875, 0.468719482421875, 0.516845703125, 0.564971923828125, 0.61309814453125, 0.661224365234375, 0.7093505859375, 0.757476806640625, 0.80560302734375, 0.853729248046875, 0.90185546875, 0.949981689453125, 0.99810791015625, 1.046234130859375, 1.0943603515625, 1.142486572265625, 1.19061279296875, 1.238739013671875, 1.286865234375, 1.334991455078125, 1.38311767578125, 1.431243896484375, 1.4793701171875, 1.527496337890625, 1.57562255859375, 1.623748779296875, 1.671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 28.0, 71.0, 135.0, 185.0, 208.0, 144.0, 100.0, 47.0, 29.0, 18.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.418155670166016, -18.450836181640625, -17.483516693115234, -16.516197204589844, -15.54887866973877, -14.581559181213379, -13.614239692687988, -12.646921157836914, -11.679601669311523, -10.712282180786133, -9.744962692260742, -8.777643203735352, -7.810324668884277, -6.843005180358887, -5.875685691833496, -4.908366680145264, -3.941046714782715, -2.9737274646759033, -2.006408214569092, -1.0390887260437012, -0.07176947593688965, 0.8955497741699219, 1.8628692626953125, 2.830188274383545, 3.7975077629089355, 4.764827251434326, 5.732146263122559, 6.699465751647949, 7.66678524017334, 8.634103775024414, 9.601423263549805, 10.568742752075195, 11.536062240600586, 12.503381729125977, 13.470701217651367, 14.438020706176758, 15.405339241027832, 16.372657775878906, 17.339977264404297, 18.307296752929688, 19.274616241455078, 20.24193572998047, 21.20925521850586, 22.17657470703125, 23.14389419555664, 24.11121368408203, 25.078533172607422, 26.04585075378418, 27.013172149658203, 27.980491638183594, 28.947811126708984, 29.915130615234375, 30.882450103759766, 31.849769592285156, 32.81708908081055, 33.78440856933594, 34.75172424316406, 35.71904373168945, 36.686363220214844, 37.653682708740234, 38.621002197265625, 39.588321685791016, 40.555641174316406, 41.5229606628418, 42.49028015136719]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 6.0, 4.0, 4.0, 6.0, 6.0, 16.0, 14.0, 16.0, 18.0, 24.0, 31.0, 37.0, 29.0, 43.0, 35.0, 35.0, 47.0, 50.0, 49.0, 42.0, 43.0, 39.0, 44.0, 43.0, 45.0, 35.0, 37.0, 34.0, 31.0, 25.0, 19.0, 18.0, 20.0, 10.0, 15.0, 6.0, 12.0, 5.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.74022102355957, -17.246177673339844, -16.752134323120117, -16.258092880249023, -15.764049530029297, -15.27000617980957, -14.775962829589844, -14.281919479370117, -13.787877082824707, -13.29383373260498, -12.79979133605957, -12.305747985839844, -11.811704635620117, -11.317662239074707, -10.82361888885498, -10.32957649230957, -9.835533142089844, -9.341489791870117, -8.847447395324707, -8.35340404510498, -7.859361171722412, -7.365318298339844, -6.871274948120117, -6.377232074737549, -5.8831892013549805, -5.389146327972412, -4.895103454589844, -4.401060104370117, -3.907017230987549, -3.4129743576049805, -2.918931245803833, -2.4248881340026855, -1.9308443069458008, -1.4368013143539429, -0.942758321762085, -0.44871532917022705, 0.04532766342163086, 0.5393705368041992, 1.0334136486053467, 1.5274567604064941, 2.0214996337890625, 2.515542507171631, 3.0095856189727783, 3.503628730773926, 3.997671604156494, 4.4917144775390625, 4.985757827758789, 5.479800701141357, 5.973843574523926, 6.467886447906494, 6.9619293212890625, 7.455972671508789, 7.950015544891357, 8.444058418273926, 8.938101768493652, 9.432144165039062, 9.926187515258789, 10.420230865478516, 10.914273262023926, 11.408316612243652, 11.902359008789062, 12.396402359008789, 12.890445709228516, 13.384489059448242, 13.878531455993652]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 14.0, 21.0, 33.0, 59.0, 131.0, 190.0, 390.0, 813.0, 1660.0, 3683.0, 8827.0, 24073.0, 74142.0, 258599.0, 771657.0, 1431802.0, 1054074.0, 397042.0, 113718.0, 33083.0, 11424.0, 4588.0, 2065.0, 984.0, 502.0, 262.0, 152.0, 90.0, 58.0, 47.0, 30.0, 14.0, 16.0, 13.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9287109375, -1.8536224365234375, -1.778533935546875, -1.7034454345703125, -1.62835693359375, -1.5532684326171875, -1.478179931640625, -1.4030914306640625, -1.3280029296875, -1.2529144287109375, -1.177825927734375, -1.1027374267578125, -1.02764892578125, -0.9525604248046875, -0.877471923828125, -0.8023834228515625, -0.727294921875, -0.6522064208984375, -0.577117919921875, -0.5020294189453125, -0.42694091796875, -0.3518524169921875, -0.276763916015625, -0.2016754150390625, -0.1265869140625, -0.0514984130859375, 0.023590087890625, 0.0986785888671875, 0.17376708984375, 0.2488555908203125, 0.323944091796875, 0.3990325927734375, 0.47412109375, 0.5492095947265625, 0.624298095703125, 0.6993865966796875, 0.77447509765625, 0.8495635986328125, 0.924652099609375, 0.9997406005859375, 1.0748291015625, 1.1499176025390625, 1.225006103515625, 1.3000946044921875, 1.37518310546875, 1.4502716064453125, 1.525360107421875, 1.6004486083984375, 1.675537109375, 1.7506256103515625, 1.825714111328125, 1.9008026123046875, 1.97589111328125, 2.0509796142578125, 2.126068115234375, 2.2011566162109375, 2.2762451171875, 2.3513336181640625, 2.426422119140625, 2.5015106201171875, 2.57659912109375, 2.6516876220703125, 2.726776123046875, 2.8018646240234375, 2.876953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 12.0, 9.0, 8.0, 7.0, 17.0, 19.0, 17.0, 21.0, 23.0, 28.0, 28.0, 30.0, 26.0, 33.0, 52.0, 41.0, 47.0, 40.0, 42.0, 40.0, 42.0, 49.0, 35.0, 36.0, 37.0, 32.0, 25.0, 22.0, 22.0, 21.0, 21.0, 18.0, 18.0, 14.0, 9.0, 15.0, 8.0, 4.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.865234375, -1.797760009765625, -1.73028564453125, -1.662811279296875, -1.5953369140625, -1.527862548828125, -1.46038818359375, -1.392913818359375, -1.325439453125, -1.257965087890625, -1.19049072265625, -1.123016357421875, -1.0555419921875, -0.988067626953125, -0.92059326171875, -0.853118896484375, -0.78564453125, -0.718170166015625, -0.65069580078125, -0.583221435546875, -0.5157470703125, -0.448272705078125, -0.38079833984375, -0.313323974609375, -0.245849609375, -0.178375244140625, -0.11090087890625, -0.043426513671875, 0.0240478515625, 0.091522216796875, 0.15899658203125, 0.226470947265625, 0.2939453125, 0.361419677734375, 0.42889404296875, 0.496368408203125, 0.5638427734375, 0.631317138671875, 0.69879150390625, 0.766265869140625, 0.833740234375, 0.901214599609375, 0.96868896484375, 1.036163330078125, 1.1036376953125, 1.171112060546875, 1.23858642578125, 1.306060791015625, 1.37353515625, 1.441009521484375, 1.50848388671875, 1.575958251953125, 1.6434326171875, 1.710906982421875, 1.77838134765625, 1.845855712890625, 1.913330078125, 1.980804443359375, 2.04827880859375, 2.115753173828125, 2.1832275390625, 2.250701904296875, 2.31817626953125, 2.385650634765625, 2.453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 9.0, 6.0, 13.0, 13.0, 17.0, 32.0, 45.0, 50.0, 103.0, 135.0, 251.0, 405.0, 722.0, 1261.0, 2353.0, 4648.0, 9595.0, 21962.0, 54348.0, 151200.0, 484775.0, 1564779.0, 1313591.0, 379568.0, 123105.0, 45457.0, 18466.0, 8477.0, 4056.0, 2046.0, 1148.0, 623.0, 327.0, 239.0, 181.0, 108.0, 66.0, 33.0, 19.0, 19.0, 9.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.544921875, -2.46514892578125, -2.3853759765625, -2.30560302734375, -2.225830078125, -2.14605712890625, -2.0662841796875, -1.98651123046875, -1.90673828125, -1.82696533203125, -1.7471923828125, -1.66741943359375, -1.587646484375, -1.50787353515625, -1.4281005859375, -1.34832763671875, -1.2685546875, -1.18878173828125, -1.1090087890625, -1.02923583984375, -0.949462890625, -0.86968994140625, -0.7899169921875, -0.71014404296875, -0.63037109375, -0.55059814453125, -0.4708251953125, -0.39105224609375, -0.311279296875, -0.23150634765625, -0.1517333984375, -0.07196044921875, 0.0078125, 0.08758544921875, 0.1673583984375, 0.24713134765625, 0.326904296875, 0.40667724609375, 0.4864501953125, 0.56622314453125, 0.64599609375, 0.72576904296875, 0.8055419921875, 0.88531494140625, 0.965087890625, 1.04486083984375, 1.1246337890625, 1.20440673828125, 1.2841796875, 1.36395263671875, 1.4437255859375, 1.52349853515625, 1.603271484375, 1.68304443359375, 1.7628173828125, 1.84259033203125, 1.92236328125, 2.00213623046875, 2.0819091796875, 2.16168212890625, 2.241455078125, 2.32122802734375, 2.4010009765625, 2.48077392578125, 2.560546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 8.0, 5.0, 4.0, 11.0, 14.0, 24.0, 18.0, 37.0, 42.0, 58.0, 74.0, 79.0, 120.0, 158.0, 204.0, 268.0, 365.0, 448.0, 439.0, 368.0, 315.0, 254.0, 202.0, 127.0, 105.0, 80.0, 58.0, 46.0, 29.0, 28.0, 23.0, 16.0, 12.0, 8.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.884765625, -3.77752685546875, -3.6702880859375, -3.56304931640625, -3.455810546875, -3.34857177734375, -3.2413330078125, -3.13409423828125, -3.02685546875, -2.91961669921875, -2.8123779296875, -2.70513916015625, -2.597900390625, -2.49066162109375, -2.3834228515625, -2.27618408203125, -2.1689453125, -2.06170654296875, -1.9544677734375, -1.84722900390625, -1.739990234375, -1.63275146484375, -1.5255126953125, -1.41827392578125, -1.31103515625, -1.20379638671875, -1.0965576171875, -0.98931884765625, -0.882080078125, -0.77484130859375, -0.6676025390625, -0.56036376953125, -0.453125, -0.34588623046875, -0.2386474609375, -0.13140869140625, -0.024169921875, 0.08306884765625, 0.1903076171875, 0.29754638671875, 0.40478515625, 0.51202392578125, 0.6192626953125, 0.72650146484375, 0.833740234375, 0.94097900390625, 1.0482177734375, 1.15545654296875, 1.2626953125, 1.36993408203125, 1.4771728515625, 1.58441162109375, 1.691650390625, 1.79888916015625, 1.9061279296875, 2.01336669921875, 2.12060546875, 2.22784423828125, 2.3350830078125, 2.44232177734375, 2.549560546875, 2.65679931640625, 2.7640380859375, 2.87127685546875, 2.978515625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 13.0, 24.0, 88.0, 188.0, 261.0, 229.0, 109.0, 48.0, 21.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.3680419921875, -44.945560455322266, -43.5230827331543, -42.10060119628906, -40.678123474121094, -39.25564193725586, -37.833160400390625, -36.410682678222656, -34.98820114135742, -33.56571960449219, -32.14324188232422, -30.720760345458984, -29.298280715942383, -27.87580108642578, -26.453319549560547, -25.030839920043945, -23.608360290527344, -22.185880661010742, -20.76340103149414, -19.340919494628906, -17.918439865112305, -16.495960235595703, -15.073479652404785, -13.650999069213867, -12.228519439697266, -10.806039810180664, -9.383559226989746, -7.961079120635986, -6.538599014282227, -5.116118907928467, -3.693638801574707, -2.271158218383789, -0.8486747741699219, 0.5738053321838379, 1.9962854385375977, 3.4187655448913574, 4.841245651245117, 6.263725757598877, 7.686205863952637, 9.108686447143555, 10.531166076660156, 11.953645706176758, 13.376126289367676, 14.798606872558594, 16.221086502075195, 17.643566131591797, 19.06604766845703, 20.488527297973633, 21.911006927490234, 23.333486557006836, 24.755966186523438, 26.178447723388672, 27.600927352905273, 29.023406982421875, 30.44588851928711, 31.86836814880371, 33.29084777832031, 34.71332931518555, 36.135807037353516, 37.55828857421875, 38.98076629638672, 40.40324783325195, 41.82572937011719, 43.248207092285156, 44.67068862915039]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 10.0, 14.0, 10.0, 10.0, 23.0, 20.0, 23.0, 25.0, 36.0, 37.0, 34.0, 32.0, 47.0, 39.0, 40.0, 50.0, 43.0, 57.0, 52.0, 56.0, 52.0, 37.0, 39.0, 34.0, 32.0, 24.0, 22.0, 18.0, 15.0, 12.0, 12.0, 7.0, 12.0, 3.0, 1.0, 3.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.33450984954834, -12.922429084777832, -12.51034927368164, -12.098268508911133, -11.686187744140625, -11.274106979370117, -10.862027168273926, -10.449946403503418, -10.037866592407227, -9.625785827636719, -9.213706016540527, -8.80162525177002, -8.389544486999512, -7.977464199066162, -7.5653839111328125, -7.153303146362305, -6.741222381591797, -6.329142093658447, -5.9170613288879395, -5.50498104095459, -5.092900276184082, -4.680819988250732, -4.268739700317383, -3.856659173965454, -3.4445786476135254, -3.0324981212615967, -2.620417594909668, -2.2083373069763184, -1.7962567806243896, -1.384176254272461, -0.9720959663391113, -0.5600154399871826, -0.1479339599609375, 0.26414650678634644, 0.6762269735336304, 1.0883073806762695, 1.5003879070281982, 1.912468433380127, 2.3245487213134766, 2.7366292476654053, 3.148709774017334, 3.5607903003692627, 3.9728708267211914, 4.384951114654541, 4.797031402587891, 5.209112167358398, 5.621192455291748, 6.033272743225098, 6.4453535079956055, 6.857433795928955, 7.269514560699463, 7.6815948486328125, 8.09367561340332, 8.505756378173828, 8.91783618927002, 9.329916954040527, 9.741996765136719, 10.154077529907227, 10.566157341003418, 10.978238105773926, 11.390318870544434, 11.802398681640625, 12.214479446411133, 12.62656021118164, 13.038640975952148]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 15.0, 29.0, 38.0, 51.0, 98.0, 137.0, 201.0, 325.0, 557.0, 909.0, 1655.0, 3010.0, 6151.0, 14299.0, 44420.0, 155341.0, 363700.0, 302166.0, 104035.0, 29976.0, 10813.0, 4814.0, 2395.0, 1377.0, 800.0, 483.0, 275.0, 180.0, 100.0, 65.0, 45.0, 31.0, 21.0, 12.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.373260498046875, -3.25628662109375, -3.139312744140625, -3.0223388671875, -2.905364990234375, -2.78839111328125, -2.671417236328125, -2.554443359375, -2.437469482421875, -2.32049560546875, -2.203521728515625, -2.0865478515625, -1.969573974609375, -1.85260009765625, -1.735626220703125, -1.61865234375, -1.501678466796875, -1.38470458984375, -1.267730712890625, -1.1507568359375, -1.033782958984375, -0.91680908203125, -0.799835205078125, -0.682861328125, -0.565887451171875, -0.44891357421875, -0.331939697265625, -0.2149658203125, -0.097991943359375, 0.01898193359375, 0.135955810546875, 0.2529296875, 0.369903564453125, 0.48687744140625, 0.603851318359375, 0.7208251953125, 0.837799072265625, 0.95477294921875, 1.071746826171875, 1.188720703125, 1.305694580078125, 1.42266845703125, 1.539642333984375, 1.6566162109375, 1.773590087890625, 1.89056396484375, 2.007537841796875, 2.12451171875, 2.241485595703125, 2.35845947265625, 2.475433349609375, 2.5924072265625, 2.709381103515625, 2.82635498046875, 2.943328857421875, 3.060302734375, 3.177276611328125, 3.29425048828125, 3.411224365234375, 3.5281982421875, 3.645172119140625, 3.76214599609375, 3.879119873046875, 3.99609375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 10.0, 7.0, 9.0, 8.0, 10.0, 15.0, 19.0, 14.0, 18.0, 25.0, 36.0, 28.0, 27.0, 29.0, 30.0, 45.0, 35.0, 40.0, 43.0, 46.0, 43.0, 50.0, 28.0, 35.0, 45.0, 35.0, 30.0, 22.0, 20.0, 21.0, 30.0, 13.0, 28.0, 13.0, 16.0, 14.0, 13.0, 8.0, 11.0, 5.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.31640625, -2.24871826171875, -2.1810302734375, -2.11334228515625, -2.045654296875, -1.97796630859375, -1.9102783203125, -1.84259033203125, -1.77490234375, -1.70721435546875, -1.6395263671875, -1.57183837890625, -1.504150390625, -1.43646240234375, -1.3687744140625, -1.30108642578125, -1.2333984375, -1.16571044921875, -1.0980224609375, -1.03033447265625, -0.962646484375, -0.89495849609375, -0.8272705078125, -0.75958251953125, -0.69189453125, -0.62420654296875, -0.5565185546875, -0.48883056640625, -0.421142578125, -0.35345458984375, -0.2857666015625, -0.21807861328125, -0.150390625, -0.08270263671875, -0.0150146484375, 0.05267333984375, 0.120361328125, 0.18804931640625, 0.2557373046875, 0.32342529296875, 0.39111328125, 0.45880126953125, 0.5264892578125, 0.59417724609375, 0.661865234375, 0.72955322265625, 0.7972412109375, 0.86492919921875, 0.9326171875, 1.00030517578125, 1.0679931640625, 1.13568115234375, 1.203369140625, 1.27105712890625, 1.3387451171875, 1.40643310546875, 1.47412109375, 1.54180908203125, 1.6094970703125, 1.67718505859375, 1.744873046875, 1.81256103515625, 1.8802490234375, 1.94793701171875, 2.015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 12.0, 20.0, 32.0, 37.0, 66.0, 86.0, 142.0, 201.0, 446.0, 667.0, 1239.0, 2299.0, 4345.0, 8550.0, 18324.0, 45852.0, 125796.0, 282814.0, 308126.0, 151778.0, 55471.0, 21291.0, 10039.0, 4962.0, 2690.0, 1359.0, 776.0, 430.0, 272.0, 168.0, 85.0, 50.0, 40.0, 25.0, 21.0, 11.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.09765625, -3.004058837890625, -2.91046142578125, -2.816864013671875, -2.7232666015625, -2.629669189453125, -2.53607177734375, -2.442474365234375, -2.348876953125, -2.255279541015625, -2.16168212890625, -2.068084716796875, -1.9744873046875, -1.880889892578125, -1.78729248046875, -1.693695068359375, -1.60009765625, -1.506500244140625, -1.41290283203125, -1.319305419921875, -1.2257080078125, -1.132110595703125, -1.03851318359375, -0.944915771484375, -0.851318359375, -0.757720947265625, -0.66412353515625, -0.570526123046875, -0.4769287109375, -0.383331298828125, -0.28973388671875, -0.196136474609375, -0.1025390625, -0.008941650390625, 0.08465576171875, 0.178253173828125, 0.2718505859375, 0.365447998046875, 0.45904541015625, 0.552642822265625, 0.646240234375, 0.739837646484375, 0.83343505859375, 0.927032470703125, 1.0206298828125, 1.114227294921875, 1.20782470703125, 1.301422119140625, 1.39501953125, 1.488616943359375, 1.58221435546875, 1.675811767578125, 1.7694091796875, 1.863006591796875, 1.95660400390625, 2.050201416015625, 2.143798828125, 2.237396240234375, 2.33099365234375, 2.424591064453125, 2.5181884765625, 2.611785888671875, 2.70538330078125, 2.798980712890625, 2.892578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 14.0, 6.0, 10.0, 10.0, 20.0, 18.0, 26.0, 36.0, 33.0, 44.0, 55.0, 50.0, 45.0, 68.0, 65.0, 56.0, 57.0, 54.0, 61.0, 53.0, 38.0, 38.0, 23.0, 24.0, 27.0, 18.0, 19.0, 16.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.5078125, -10.23016357421875, -9.9525146484375, -9.67486572265625, -9.397216796875, -9.11956787109375, -8.8419189453125, -8.56427001953125, -8.28662109375, -8.00897216796875, -7.7313232421875, -7.45367431640625, -7.176025390625, -6.89837646484375, -6.6207275390625, -6.34307861328125, -6.0654296875, -5.78778076171875, -5.5101318359375, -5.23248291015625, -4.954833984375, -4.67718505859375, -4.3995361328125, -4.12188720703125, -3.84423828125, -3.56658935546875, -3.2889404296875, -3.01129150390625, -2.733642578125, -2.45599365234375, -2.1783447265625, -1.90069580078125, -1.623046875, -1.34539794921875, -1.0677490234375, -0.79010009765625, -0.512451171875, -0.23480224609375, 0.0428466796875, 0.32049560546875, 0.59814453125, 0.87579345703125, 1.1534423828125, 1.43109130859375, 1.708740234375, 1.98638916015625, 2.2640380859375, 2.54168701171875, 2.8193359375, 3.09698486328125, 3.3746337890625, 3.65228271484375, 3.929931640625, 4.20758056640625, 4.4852294921875, 4.76287841796875, 5.04052734375, 5.31817626953125, 5.5958251953125, 5.87347412109375, 6.151123046875, 6.42877197265625, 6.7064208984375, 6.98406982421875, 7.26171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 16.0, 17.0, 37.0, 33.0, 54.0, 87.0, 119.0, 175.0, 250.0, 427.0, 555.0, 856.0, 1279.0, 2171.0, 3318.0, 5392.0, 8738.0, 14481.0, 24041.0, 39770.0, 66124.0, 106717.0, 154195.0, 180168.0, 157073.0, 109251.0, 68264.0, 40839.0, 24790.0, 14823.0, 9247.0, 5498.0, 3453.0, 2183.0, 1378.0, 902.0, 605.0, 385.0, 248.0, 176.0, 123.0, 69.0, 72.0, 45.0, 31.0, 22.0, 9.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.5400390625, -0.5234375, -0.5068359375, -0.490234375, -0.4736328125, -0.45703125, -0.4404296875, -0.423828125, -0.4072265625, -0.390625, -0.3740234375, -0.357421875, -0.3408203125, -0.32421875, -0.3076171875, -0.291015625, -0.2744140625, -0.2578125, -0.2412109375, -0.224609375, -0.2080078125, -0.19140625, -0.1748046875, -0.158203125, -0.1416015625, -0.125, -0.1083984375, -0.091796875, -0.0751953125, -0.05859375, -0.0419921875, -0.025390625, -0.0087890625, 0.0078125, 0.0244140625, 0.041015625, 0.0576171875, 0.07421875, 0.0908203125, 0.107421875, 0.1240234375, 0.140625, 0.1572265625, 0.173828125, 0.1904296875, 0.20703125, 0.2236328125, 0.240234375, 0.2568359375, 0.2734375, 0.2900390625, 0.306640625, 0.3232421875, 0.33984375, 0.3564453125, 0.373046875, 0.3896484375, 0.40625, 0.4228515625, 0.439453125, 0.4560546875, 0.47265625, 0.4892578125, 0.505859375, 0.5224609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 7.0, 5.0, 5.0, 12.0, 17.0, 10.0, 20.0, 36.0, 31.0, 54.0, 73.0, 91.0, 113.0, 123.0, 109.0, 79.0, 63.0, 35.0, 32.0, 18.0, 11.0, 18.0, 10.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004665851593017578, -0.00045154616236686707, -0.0004365071654319763, -0.00042146816849708557, -0.0004064291715621948, -0.0003913901746273041, -0.00037635117769241333, -0.0003613121807575226, -0.00034627318382263184, -0.0003312341868877411, -0.00031619518995285034, -0.0003011561930179596, -0.00028611719608306885, -0.0002710781991481781, -0.00025603920221328735, -0.0002410002052783966, -0.00022596120834350586, -0.0002109222114086151, -0.00019588321447372437, -0.00018084421753883362, -0.00016580522060394287, -0.00015076622366905212, -0.00013572722673416138, -0.00012068822979927063, -0.00010564923286437988, -9.061023592948914e-05, -7.557123899459839e-05, -6.053224205970764e-05, -4.5493245124816895e-05, -3.0454248189926147e-05, -1.54152512550354e-05, -3.762543201446533e-07, 1.4662742614746094e-05, 2.970173954963684e-05, 4.474073648452759e-05, 5.9779733419418335e-05, 7.481873035430908e-05, 8.985772728919983e-05, 0.00010489672422409058, 0.00011993572115898132, 0.00013497471809387207, 0.00015001371502876282, 0.00016505271196365356, 0.0001800917088985443, 0.00019513070583343506, 0.0002101697027683258, 0.00022520869970321655, 0.0002402476966381073, 0.00025528669357299805, 0.0002703256905078888, 0.00028536468744277954, 0.0003004036843776703, 0.00031544268131256104, 0.0003304816782474518, 0.00034552067518234253, 0.0003605596721172333, 0.000375598669052124, 0.00039063766598701477, 0.0004056766629219055, 0.00042071565985679626, 0.000435754656791687, 0.00045079365372657776, 0.0004658326506614685, 0.00048087164759635925, 0.00049591064453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 9.0, 19.0, 24.0, 52.0, 74.0, 124.0, 200.0, 343.0, 543.0, 999.0, 1878.0, 3567.0, 6981.0, 13505.0, 26917.0, 53218.0, 99926.0, 167074.0, 215270.0, 191529.0, 124917.0, 68872.0, 35486.0, 17753.0, 9048.0, 4675.0, 2491.0, 1295.0, 734.0, 409.0, 225.0, 145.0, 70.0, 40.0, 39.0, 29.0, 19.0, 16.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.7158203125, -0.6951904296875, -0.674560546875, -0.6539306640625, -0.63330078125, -0.6126708984375, -0.592041015625, -0.5714111328125, -0.55078125, -0.5301513671875, -0.509521484375, -0.4888916015625, -0.46826171875, -0.4476318359375, -0.427001953125, -0.4063720703125, -0.3857421875, -0.3651123046875, -0.344482421875, -0.3238525390625, -0.30322265625, -0.2825927734375, -0.261962890625, -0.2413330078125, -0.220703125, -0.2000732421875, -0.179443359375, -0.1588134765625, -0.13818359375, -0.1175537109375, -0.096923828125, -0.0762939453125, -0.0556640625, -0.0350341796875, -0.014404296875, 0.0062255859375, 0.02685546875, 0.0474853515625, 0.068115234375, 0.0887451171875, 0.109375, 0.1300048828125, 0.150634765625, 0.1712646484375, 0.19189453125, 0.2125244140625, 0.233154296875, 0.2537841796875, 0.2744140625, 0.2950439453125, 0.315673828125, 0.3363037109375, 0.35693359375, 0.3775634765625, 0.398193359375, 0.4188232421875, 0.439453125, 0.4600830078125, 0.480712890625, 0.5013427734375, 0.52197265625, 0.5426025390625, 0.563232421875, 0.5838623046875, 0.6044921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 7.0, 6.0, 9.0, 9.0, 14.0, 21.0, 12.0, 22.0, 24.0, 22.0, 28.0, 40.0, 46.0, 43.0, 39.0, 40.0, 68.0, 58.0, 40.0, 40.0, 48.0, 41.0, 52.0, 49.0, 38.0, 29.0, 28.0, 27.0, 11.0, 15.0, 9.0, 9.0, 8.0, 14.0, 9.0, 7.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.92822265625, -0.9015960693359375, -0.874969482421875, -0.8483428955078125, -0.82171630859375, -0.7950897216796875, -0.768463134765625, -0.7418365478515625, -0.7152099609375, -0.6885833740234375, -0.661956787109375, -0.6353302001953125, -0.60870361328125, -0.5820770263671875, -0.555450439453125, -0.5288238525390625, -0.502197265625, -0.4755706787109375, -0.448944091796875, -0.4223175048828125, -0.39569091796875, -0.3690643310546875, -0.342437744140625, -0.3158111572265625, -0.2891845703125, -0.2625579833984375, -0.235931396484375, -0.2093048095703125, -0.18267822265625, -0.1560516357421875, -0.129425048828125, -0.1027984619140625, -0.076171875, -0.0495452880859375, -0.022918701171875, 0.0037078857421875, 0.03033447265625, 0.0569610595703125, 0.083587646484375, 0.1102142333984375, 0.1368408203125, 0.1634674072265625, 0.190093994140625, 0.2167205810546875, 0.24334716796875, 0.2699737548828125, 0.296600341796875, 0.3232269287109375, 0.349853515625, 0.3764801025390625, 0.403106689453125, 0.4297332763671875, 0.45635986328125, 0.4829864501953125, 0.509613037109375, 0.5362396240234375, 0.5628662109375, 0.5894927978515625, 0.616119384765625, 0.6427459716796875, 0.66937255859375, 0.6959991455078125, 0.722625732421875, 0.7492523193359375, 0.77587890625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 12.0, 4.0, 17.0, 30.0, 38.0, 65.0, 116.0, 142.0, 163.0, 138.0, 105.0, 69.0, 30.0, 23.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-24.56344985961914, -23.81045913696289, -23.05746841430664, -22.30447769165039, -21.55148696899414, -20.798498153686523, -20.045507431030273, -19.292516708374023, -18.539525985717773, -17.786535263061523, -17.033544540405273, -16.280553817749023, -15.52756404876709, -14.77457332611084, -14.021583557128906, -13.268592834472656, -12.515602111816406, -11.762611389160156, -11.009620666503906, -10.256630897521973, -9.503640174865723, -8.750649452209473, -7.997659206390381, -7.244668960571289, -6.491678237915039, -5.738687515258789, -4.985697269439697, -4.2327070236206055, -3.4797163009643555, -2.7267258167266846, -1.9737353324890137, -1.2207450866699219, -0.46775245666503906, 0.28523802757263184, 1.0382285118103027, 1.7912189960479736, 2.5442094802856445, 3.2971999645233154, 4.050190448760986, 4.803180694580078, 5.556171417236328, 6.309162139892578, 7.06215238571167, 7.815142631530762, 8.568133354187012, 9.321124076843262, 10.074113845825195, 10.827104568481445, 11.580095291137695, 12.333086013793945, 13.086076736450195, 13.839066505432129, 14.592057228088379, 15.345047950744629, 16.098037719726562, 16.851028442382812, 17.604019165039062, 18.357009887695312, 19.110000610351562, 19.862991333007812, 20.615982055664062, 21.36897087097168, 22.12196159362793, 22.87495231628418, 23.62794303894043]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 13.0, 13.0, 23.0, 21.0, 19.0, 26.0, 30.0, 39.0, 35.0, 44.0, 34.0, 45.0, 37.0, 38.0, 35.0, 38.0, 44.0, 43.0, 32.0, 36.0, 26.0, 35.0, 27.0, 33.0, 23.0, 23.0, 18.0, 17.0, 15.0, 14.0, 16.0, 8.0, 8.0, 14.0, 6.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.432417869567871, -10.983609199523926, -10.534799575805664, -10.085990905761719, -9.637182235717773, -9.188373565673828, -8.739563941955566, -8.290755271911621, -7.841946125030518, -7.393136978149414, -6.944328308105469, -6.495519161224365, -6.046710014343262, -5.597901344299316, -5.149092197418213, -4.700283050537109, -4.251474380493164, -3.8026654720306396, -3.3538565635681152, -2.9050474166870117, -2.4562385082244873, -2.007429599761963, -1.5586204528808594, -1.109811544418335, -0.6610026359558105, -0.21219366788864136, 0.23661530017852783, 0.6854243278503418, 1.1342332363128662, 1.5830421447753906, 2.031851291656494, 2.4806602001190186, 2.9294700622558594, 3.378278970718384, 3.827087879180908, 4.275897026062012, 4.724705696105957, 5.1735148429870605, 5.622323989868164, 6.071132659912109, 6.519941806793213, 6.968750953674316, 7.417559623718262, 7.866368770599365, 8.315177917480469, 8.763986587524414, 9.21279525756836, 9.661604881286621, 10.110413551330566, 10.559222221374512, 11.008031845092773, 11.456840515136719, 11.905649185180664, 12.35445785522461, 12.803267478942871, 13.252076148986816, 13.700885772705078, 14.149694442749023, 14.598504066467285, 15.04731273651123, 15.496121406555176, 15.944931030273438, 16.393739700317383, 16.842548370361328, 17.291357040405273]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 15.0, 17.0, 49.0, 60.0, 75.0, 179.0, 246.0, 477.0, 912.0, 1983.0, 4265.0, 10179.0, 27170.0, 85078.0, 302368.0, 923855.0, 1538689.0, 899975.0, 281929.0, 75787.0, 24166.0, 9148.0, 3909.0, 1766.0, 856.0, 476.0, 282.0, 150.0, 77.0, 53.0, 25.0, 28.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.98455810546875, -1.9066162109375, -1.82867431640625, -1.750732421875, -1.67279052734375, -1.5948486328125, -1.51690673828125, -1.43896484375, -1.36102294921875, -1.2830810546875, -1.20513916015625, -1.127197265625, -1.04925537109375, -0.9713134765625, -0.89337158203125, -0.8154296875, -0.73748779296875, -0.6595458984375, -0.58160400390625, -0.503662109375, -0.42572021484375, -0.3477783203125, -0.26983642578125, -0.19189453125, -0.11395263671875, -0.0360107421875, 0.04193115234375, 0.119873046875, 0.19781494140625, 0.2757568359375, 0.35369873046875, 0.431640625, 0.50958251953125, 0.5875244140625, 0.66546630859375, 0.743408203125, 0.82135009765625, 0.8992919921875, 0.97723388671875, 1.05517578125, 1.13311767578125, 1.2110595703125, 1.28900146484375, 1.366943359375, 1.44488525390625, 1.5228271484375, 1.60076904296875, 1.6787109375, 1.75665283203125, 1.8345947265625, 1.91253662109375, 1.990478515625, 2.06842041015625, 2.1463623046875, 2.22430419921875, 2.30224609375, 2.38018798828125, 2.4581298828125, 2.53607177734375, 2.614013671875, 2.69195556640625, 2.7698974609375, 2.84783935546875, 2.92578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 10.0, 17.0, 8.0, 11.0, 22.0, 23.0, 14.0, 30.0, 33.0, 31.0, 37.0, 36.0, 32.0, 36.0, 38.0, 43.0, 40.0, 36.0, 42.0, 40.0, 39.0, 39.0, 45.0, 36.0, 37.0, 30.0, 26.0, 19.0, 12.0, 21.0, 24.0, 18.0, 13.0, 9.0, 15.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.81640625, -1.75372314453125, -1.6910400390625, -1.62835693359375, -1.565673828125, -1.50299072265625, -1.4403076171875, -1.37762451171875, -1.31494140625, -1.25225830078125, -1.1895751953125, -1.12689208984375, -1.064208984375, -1.00152587890625, -0.9388427734375, -0.87615966796875, -0.8134765625, -0.75079345703125, -0.6881103515625, -0.62542724609375, -0.562744140625, -0.50006103515625, -0.4373779296875, -0.37469482421875, -0.31201171875, -0.24932861328125, -0.1866455078125, -0.12396240234375, -0.061279296875, 0.00140380859375, 0.0640869140625, 0.12677001953125, 0.189453125, 0.25213623046875, 0.3148193359375, 0.37750244140625, 0.440185546875, 0.50286865234375, 0.5655517578125, 0.62823486328125, 0.69091796875, 0.75360107421875, 0.8162841796875, 0.87896728515625, 0.941650390625, 1.00433349609375, 1.0670166015625, 1.12969970703125, 1.1923828125, 1.25506591796875, 1.3177490234375, 1.38043212890625, 1.443115234375, 1.50579833984375, 1.5684814453125, 1.63116455078125, 1.69384765625, 1.75653076171875, 1.8192138671875, 1.88189697265625, 1.944580078125, 2.00726318359375, 2.0699462890625, 2.13262939453125, 2.1953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 9.0, 9.0, 20.0, 24.0, 35.0, 57.0, 115.0, 210.0, 389.0, 820.0, 1758.0, 4138.0, 11838.0, 38225.0, 154735.0, 917048.0, 2420646.0, 505622.0, 98044.0, 26110.0, 8517.0, 3244.0, 1328.0, 648.0, 265.0, 170.0, 86.0, 68.0, 32.0, 21.0, 15.0, 14.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.499481201171875, -2.38763427734375, -2.275787353515625, -2.1639404296875, -2.052093505859375, -1.94024658203125, -1.828399658203125, -1.716552734375, -1.604705810546875, -1.49285888671875, -1.381011962890625, -1.2691650390625, -1.157318115234375, -1.04547119140625, -0.933624267578125, -0.82177734375, -0.709930419921875, -0.59808349609375, -0.486236572265625, -0.3743896484375, -0.262542724609375, -0.15069580078125, -0.038848876953125, 0.072998046875, 0.184844970703125, 0.29669189453125, 0.408538818359375, 0.5203857421875, 0.632232666015625, 0.74407958984375, 0.855926513671875, 0.9677734375, 1.079620361328125, 1.19146728515625, 1.303314208984375, 1.4151611328125, 1.527008056640625, 1.63885498046875, 1.750701904296875, 1.862548828125, 1.974395751953125, 2.08624267578125, 2.198089599609375, 2.3099365234375, 2.421783447265625, 2.53363037109375, 2.645477294921875, 2.75732421875, 2.869171142578125, 2.98101806640625, 3.092864990234375, 3.2047119140625, 3.316558837890625, 3.42840576171875, 3.540252685546875, 3.652099609375, 3.763946533203125, 3.87579345703125, 3.987640380859375, 4.0994873046875, 4.211334228515625, 4.32318115234375, 4.435028076171875, 4.546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 10.0, 24.0, 14.0, 39.0, 51.0, 91.0, 114.0, 177.0, 295.0, 485.0, 692.0, 693.0, 519.0, 323.0, 182.0, 111.0, 83.0, 52.0, 41.0, 29.0, 20.0, 13.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.8076171875, -5.646484375, -5.4853515625, -5.32421875, -5.1630859375, -5.001953125, -4.8408203125, -4.6796875, -4.5185546875, -4.357421875, -4.1962890625, -4.03515625, -3.8740234375, -3.712890625, -3.5517578125, -3.390625, -3.2294921875, -3.068359375, -2.9072265625, -2.74609375, -2.5849609375, -2.423828125, -2.2626953125, -2.1015625, -1.9404296875, -1.779296875, -1.6181640625, -1.45703125, -1.2958984375, -1.134765625, -0.9736328125, -0.8125, -0.6513671875, -0.490234375, -0.3291015625, -0.16796875, -0.0068359375, 0.154296875, 0.3154296875, 0.4765625, 0.6376953125, 0.798828125, 0.9599609375, 1.12109375, 1.2822265625, 1.443359375, 1.6044921875, 1.765625, 1.9267578125, 2.087890625, 2.2490234375, 2.41015625, 2.5712890625, 2.732421875, 2.8935546875, 3.0546875, 3.2158203125, 3.376953125, 3.5380859375, 3.69921875, 3.8603515625, 4.021484375, 4.1826171875, 4.34375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 11.0, 14.0, 37.0, 111.0, 184.0, 224.0, 200.0, 117.0, 52.0, 26.0, 12.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.118736267089844, -50.80192565917969, -49.48511505126953, -48.16830825805664, -46.851497650146484, -45.53468704223633, -44.21787643432617, -42.901065826416016, -41.584259033203125, -40.26744842529297, -38.95063781738281, -37.63383102416992, -36.317020416259766, -35.00020980834961, -33.68339920043945, -32.3665885925293, -31.04977798461914, -29.732967376708984, -28.41615867614746, -27.099348068237305, -25.78253936767578, -24.465728759765625, -23.14891815185547, -21.832107543945312, -20.51529884338379, -19.198488235473633, -17.88167953491211, -16.564868927001953, -15.248059272766113, -13.931249618530273, -12.614439010620117, -11.297629356384277, -9.980815887451172, -8.664006233215332, -7.347196102142334, -6.030385971069336, -4.713576316833496, -3.3967666625976562, -2.079956531524658, -0.7631464004516602, 0.5536632537841797, 1.8704731464385986, 3.1872830390930176, 4.504093170166016, 5.8209028244018555, 7.137712478637695, 8.454523086547852, 9.771332740783691, 11.088142395019531, 12.404952049255371, 13.721761703491211, 15.038572311401367, 16.35538101196289, 17.672191619873047, 18.989002227783203, 20.30581283569336, 21.622621536254883, 22.93943214416504, 24.256240844726562, 25.57305145263672, 26.889862060546875, 28.2066707611084, 29.523481369018555, 30.840290069580078, 32.157100677490234]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 10.0, 8.0, 9.0, 5.0, 9.0, 16.0, 16.0, 19.0, 25.0, 23.0, 19.0, 21.0, 33.0, 34.0, 26.0, 42.0, 28.0, 43.0, 46.0, 37.0, 36.0, 43.0, 34.0, 48.0, 36.0, 34.0, 28.0, 25.0, 30.0, 27.0, 15.0, 20.0, 16.0, 29.0, 13.0, 12.0, 11.0, 12.0, 11.0, 12.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.721087455749512, -9.388763427734375, -9.056439399719238, -8.724115371704102, -8.391791343688965, -8.059467315673828, -7.727143287658691, -7.394819259643555, -7.062495231628418, -6.730171203613281, -6.3978471755981445, -6.065523147583008, -5.733199119567871, -5.400875091552734, -5.068551063537598, -4.736227035522461, -4.403903007507324, -4.0715789794921875, -3.739254951477051, -3.406930923461914, -3.0746068954467773, -2.7422828674316406, -2.409958839416504, -2.077634811401367, -1.7453107833862305, -1.4129867553710938, -1.080662727355957, -0.7483386993408203, -0.4160146713256836, -0.08369064331054688, 0.24863338470458984, 0.5809574127197266, 0.9132823944091797, 1.2456064224243164, 1.5779304504394531, 1.9102544784545898, 2.2425785064697266, 2.5749025344848633, 2.9072265625, 3.2395505905151367, 3.5718746185302734, 3.90419864654541, 4.236522674560547, 4.568846702575684, 4.90117073059082, 5.233494758605957, 5.565818786621094, 5.8981428146362305, 6.230466842651367, 6.562790870666504, 6.895114898681641, 7.227438926696777, 7.559762954711914, 7.892086982727051, 8.224411010742188, 8.556735038757324, 8.889059066772461, 9.221383094787598, 9.553707122802734, 9.886031150817871, 10.218355178833008, 10.550679206848145, 10.883003234863281, 11.215327262878418, 11.547651290893555]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 14.0, 17.0, 19.0, 26.0, 35.0, 71.0, 90.0, 158.0, 227.0, 392.0, 627.0, 1018.0, 1719.0, 3138.0, 5530.0, 9809.0, 17835.0, 32235.0, 56536.0, 94467.0, 142666.0, 179776.0, 173785.0, 131081.0, 84438.0, 49586.0, 28143.0, 15174.0, 8393.0, 4755.0, 2822.0, 1544.0, 908.0, 562.0, 317.0, 237.0, 147.0, 78.0, 57.0, 43.0, 26.0, 17.0, 16.0, 9.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.6982421875, -1.6481170654296875, -1.597991943359375, -1.5478668212890625, -1.49774169921875, -1.4476165771484375, -1.397491455078125, -1.3473663330078125, -1.2972412109375, -1.2471160888671875, -1.196990966796875, -1.1468658447265625, -1.09674072265625, -1.0466156005859375, -0.996490478515625, -0.9463653564453125, -0.896240234375, -0.8461151123046875, -0.795989990234375, -0.7458648681640625, -0.69573974609375, -0.6456146240234375, -0.595489501953125, -0.5453643798828125, -0.4952392578125, -0.4451141357421875, -0.394989013671875, -0.3448638916015625, -0.29473876953125, -0.2446136474609375, -0.194488525390625, -0.1443634033203125, -0.09423828125, -0.0441131591796875, 0.006011962890625, 0.0561370849609375, 0.10626220703125, 0.1563873291015625, 0.206512451171875, 0.2566375732421875, 0.3067626953125, 0.3568878173828125, 0.407012939453125, 0.4571380615234375, 0.50726318359375, 0.5573883056640625, 0.607513427734375, 0.6576385498046875, 0.707763671875, 0.7578887939453125, 0.808013916015625, 0.8581390380859375, 0.90826416015625, 0.9583892822265625, 1.008514404296875, 1.0586395263671875, 1.1087646484375, 1.1588897705078125, 1.209014892578125, 1.2591400146484375, 1.30926513671875, 1.3593902587890625, 1.409515380859375, 1.4596405029296875, 1.509765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 9.0, 6.0, 9.0, 13.0, 16.0, 12.0, 11.0, 37.0, 34.0, 33.0, 44.0, 46.0, 37.0, 38.0, 54.0, 44.0, 46.0, 60.0, 42.0, 45.0, 37.0, 51.0, 33.0, 45.0, 30.0, 28.0, 26.0, 16.0, 24.0, 25.0, 8.0, 10.0, 11.0, 4.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.4298095703125, -2.345947265625, -2.2620849609375, -2.17822265625, -2.0943603515625, -2.010498046875, -1.9266357421875, -1.8427734375, -1.7589111328125, -1.675048828125, -1.5911865234375, -1.50732421875, -1.4234619140625, -1.339599609375, -1.2557373046875, -1.171875, -1.0880126953125, -1.004150390625, -0.9202880859375, -0.83642578125, -0.7525634765625, -0.668701171875, -0.5848388671875, -0.5009765625, -0.4171142578125, -0.333251953125, -0.2493896484375, -0.16552734375, -0.0816650390625, 0.002197265625, 0.0860595703125, 0.169921875, 0.2537841796875, 0.337646484375, 0.4215087890625, 0.50537109375, 0.5892333984375, 0.673095703125, 0.7569580078125, 0.8408203125, 0.9246826171875, 1.008544921875, 1.0924072265625, 1.17626953125, 1.2601318359375, 1.343994140625, 1.4278564453125, 1.51171875, 1.5955810546875, 1.679443359375, 1.7633056640625, 1.84716796875, 1.9310302734375, 2.014892578125, 2.0987548828125, 2.1826171875, 2.2664794921875, 2.350341796875, 2.4342041015625, 2.51806640625, 2.6019287109375, 2.685791015625, 2.7696533203125, 2.853515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 9.0, 21.0, 28.0, 35.0, 69.0, 87.0, 174.0, 292.0, 391.0, 779.0, 1372.0, 2581.0, 5082.0, 10533.0, 22475.0, 48468.0, 103472.0, 197783.0, 287824.0, 186216.0, 95276.0, 44730.0, 20447.0, 9808.0, 4865.0, 2445.0, 1381.0, 719.0, 436.0, 281.0, 178.0, 106.0, 59.0, 37.0, 23.0, 22.0, 4.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.236328125, -2.169464111328125, -2.10260009765625, -2.035736083984375, -1.9688720703125, -1.902008056640625, -1.83514404296875, -1.768280029296875, -1.701416015625, -1.634552001953125, -1.56768798828125, -1.500823974609375, -1.4339599609375, -1.367095947265625, -1.30023193359375, -1.233367919921875, -1.16650390625, -1.099639892578125, -1.03277587890625, -0.965911865234375, -0.8990478515625, -0.832183837890625, -0.76531982421875, -0.698455810546875, -0.631591796875, -0.564727783203125, -0.49786376953125, -0.430999755859375, -0.3641357421875, -0.297271728515625, -0.23040771484375, -0.163543701171875, -0.0966796875, -0.029815673828125, 0.03704833984375, 0.103912353515625, 0.1707763671875, 0.237640380859375, 0.30450439453125, 0.371368408203125, 0.438232421875, 0.505096435546875, 0.57196044921875, 0.638824462890625, 0.7056884765625, 0.772552490234375, 0.83941650390625, 0.906280517578125, 0.97314453125, 1.040008544921875, 1.10687255859375, 1.173736572265625, 1.2406005859375, 1.307464599609375, 1.37432861328125, 1.441192626953125, 1.508056640625, 1.574920654296875, 1.64178466796875, 1.708648681640625, 1.7755126953125, 1.842376708984375, 1.90924072265625, 1.976104736328125, 2.04296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 11.0, 17.0, 26.0, 14.0, 15.0, 22.0, 25.0, 30.0, 33.0, 33.0, 50.0, 38.0, 42.0, 39.0, 49.0, 38.0, 36.0, 43.0, 40.0, 46.0, 42.0, 48.0, 35.0, 30.0, 29.0, 20.0, 19.0, 14.0, 17.0, 19.0, 15.0, 10.0, 7.0, 2.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.9453125, -5.7509765625, -5.556640625, -5.3623046875, -5.16796875, -4.9736328125, -4.779296875, -4.5849609375, -4.390625, -4.1962890625, -4.001953125, -3.8076171875, -3.61328125, -3.4189453125, -3.224609375, -3.0302734375, -2.8359375, -2.6416015625, -2.447265625, -2.2529296875, -2.05859375, -1.8642578125, -1.669921875, -1.4755859375, -1.28125, -1.0869140625, -0.892578125, -0.6982421875, -0.50390625, -0.3095703125, -0.115234375, 0.0791015625, 0.2734375, 0.4677734375, 0.662109375, 0.8564453125, 1.05078125, 1.2451171875, 1.439453125, 1.6337890625, 1.828125, 2.0224609375, 2.216796875, 2.4111328125, 2.60546875, 2.7998046875, 2.994140625, 3.1884765625, 3.3828125, 3.5771484375, 3.771484375, 3.9658203125, 4.16015625, 4.3544921875, 4.548828125, 4.7431640625, 4.9375, 5.1318359375, 5.326171875, 5.5205078125, 5.71484375, 5.9091796875, 6.103515625, 6.2978515625, 6.4921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 10.0, 10.0, 12.0, 21.0, 31.0, 49.0, 71.0, 105.0, 157.0, 262.0, 406.0, 741.0, 1364.0, 2185.0, 4118.0, 7388.0, 13546.0, 25270.0, 46254.0, 81642.0, 136890.0, 225735.0, 199118.0, 130203.0, 77388.0, 43479.0, 23528.0, 12728.0, 6727.0, 3880.0, 2082.0, 1264.0, 724.0, 441.0, 267.0, 170.0, 98.0, 55.0, 37.0, 22.0, 22.0, 8.0, 14.0, 5.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.395263671875, -0.3824920654296875, -0.369720458984375, -0.3569488525390625, -0.34417724609375, -0.3314056396484375, -0.318634033203125, -0.3058624267578125, -0.2930908203125, -0.2803192138671875, -0.267547607421875, -0.2547760009765625, -0.24200439453125, -0.2292327880859375, -0.216461181640625, -0.2036895751953125, -0.19091796875, -0.1781463623046875, -0.165374755859375, -0.1526031494140625, -0.13983154296875, -0.1270599365234375, -0.114288330078125, -0.1015167236328125, -0.0887451171875, -0.0759735107421875, -0.063201904296875, -0.0504302978515625, -0.03765869140625, -0.0248870849609375, -0.012115478515625, 0.0006561279296875, 0.013427734375, 0.0261993408203125, 0.038970947265625, 0.0517425537109375, 0.06451416015625, 0.0772857666015625, 0.090057373046875, 0.1028289794921875, 0.1156005859375, 0.1283721923828125, 0.141143798828125, 0.1539154052734375, 0.16668701171875, 0.1794586181640625, 0.192230224609375, 0.2050018310546875, 0.2177734375, 0.2305450439453125, 0.243316650390625, 0.2560882568359375, 0.26885986328125, 0.2816314697265625, 0.294403076171875, 0.3071746826171875, 0.3199462890625, 0.3327178955078125, 0.345489501953125, 0.3582611083984375, 0.37103271484375, 0.3838043212890625, 0.396575927734375, 0.4093475341796875, 0.422119140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 6.0, 15.0, 19.0, 18.0, 25.0, 35.0, 35.0, 39.0, 34.0, 38.0, 64.0, 52.0, 74.0, 62.0, 67.0, 52.0, 60.0, 50.0, 47.0, 23.0, 30.0, 24.0, 19.0, 18.0, 21.0, 6.0, 9.0, 7.0, 8.0, 5.0, 2.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002390146255493164, -0.00023225508630275726, -0.00022549554705619812, -0.00021873600780963898, -0.00021197646856307983, -0.0002052169293165207, -0.00019845739006996155, -0.0001916978508234024, -0.00018493831157684326, -0.00017817877233028412, -0.00017141923308372498, -0.00016465969383716583, -0.0001579001545906067, -0.00015114061534404755, -0.0001443810760974884, -0.00013762153685092926, -0.00013086199760437012, -0.00012410245835781097, -0.00011734291911125183, -0.00011058337986469269, -0.00010382384061813354, -9.70643013715744e-05, -9.030476212501526e-05, -8.354522287845612e-05, -7.678568363189697e-05, -7.002614438533783e-05, -6.326660513877869e-05, -5.6507065892219543e-05, -4.97475266456604e-05, -4.298798739910126e-05, -3.6228448152542114e-05, -2.946890890598297e-05, -2.2709369659423828e-05, -1.5949830412864685e-05, -9.190291166305542e-06, -2.430751919746399e-06, 4.328787326812744e-06, 1.1088326573371887e-05, 1.784786581993103e-05, 2.4607405066490173e-05, 3.1366944313049316e-05, 3.812648355960846e-05, 4.48860228061676e-05, 5.1645562052726746e-05, 5.840510129928589e-05, 6.516464054584503e-05, 7.192417979240417e-05, 7.868371903896332e-05, 8.544325828552246e-05, 9.22027975320816e-05, 9.896233677864075e-05, 0.00010572187602519989, 0.00011248141527175903, 0.00011924095451831818, 0.00012600049376487732, 0.00013276003301143646, 0.0001395195722579956, 0.00014627911150455475, 0.0001530386507511139, 0.00015979818999767303, 0.00016655772924423218, 0.00017331726849079132, 0.00018007680773735046, 0.0001868363469839096, 0.00019359588623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 9.0, 17.0, 20.0, 33.0, 64.0, 119.0, 218.0, 364.0, 753.0, 1404.0, 2765.0, 5753.0, 11500.0, 23738.0, 46743.0, 88468.0, 152532.0, 246640.0, 199260.0, 125629.0, 70355.0, 36279.0, 18263.0, 8822.0, 4355.0, 2136.0, 1049.0, 550.0, 312.0, 161.0, 91.0, 64.0, 30.0, 21.0, 10.0, 6.0, 8.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.55859375, -0.5434188842773438, -0.5282440185546875, -0.5130691528320312, -0.497894287109375, -0.48271942138671875, -0.4675445556640625, -0.45236968994140625, -0.43719482421875, -0.42201995849609375, -0.4068450927734375, -0.39167022705078125, -0.376495361328125, -0.36132049560546875, -0.3461456298828125, -0.33097076416015625, -0.3157958984375, -0.30062103271484375, -0.2854461669921875, -0.27027130126953125, -0.255096435546875, -0.23992156982421875, -0.2247467041015625, -0.20957183837890625, -0.19439697265625, -0.17922210693359375, -0.1640472412109375, -0.14887237548828125, -0.133697509765625, -0.11852264404296875, -0.1033477783203125, -0.08817291259765625, -0.072998046875, -0.05782318115234375, -0.0426483154296875, -0.02747344970703125, -0.012298583984375, 0.00287628173828125, 0.0180511474609375, 0.03322601318359375, 0.04840087890625, 0.06357574462890625, 0.0787506103515625, 0.09392547607421875, 0.109100341796875, 0.12427520751953125, 0.1394500732421875, 0.15462493896484375, 0.1697998046875, 0.18497467041015625, 0.2001495361328125, 0.21532440185546875, 0.230499267578125, 0.24567413330078125, 0.2608489990234375, 0.27602386474609375, 0.29119873046875, 0.30637359619140625, 0.3215484619140625, 0.33672332763671875, 0.351898193359375, 0.36707305908203125, 0.3822479248046875, 0.39742279052734375, 0.41259765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 4.0, 3.0, 7.0, 14.0, 9.0, 10.0, 20.0, 18.0, 18.0, 22.0, 35.0, 32.0, 34.0, 26.0, 45.0, 48.0, 48.0, 47.0, 50.0, 56.0, 54.0, 50.0, 52.0, 41.0, 34.0, 29.0, 47.0, 25.0, 21.0, 14.0, 12.0, 15.0, 6.0, 9.0, 6.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.599609375, -0.5784912109375, -0.557373046875, -0.5362548828125, -0.51513671875, -0.4940185546875, -0.472900390625, -0.4517822265625, -0.4306640625, -0.4095458984375, -0.388427734375, -0.3673095703125, -0.34619140625, -0.3250732421875, -0.303955078125, -0.2828369140625, -0.26171875, -0.2406005859375, -0.219482421875, -0.1983642578125, -0.17724609375, -0.1561279296875, -0.135009765625, -0.1138916015625, -0.0927734375, -0.0716552734375, -0.050537109375, -0.0294189453125, -0.00830078125, 0.0128173828125, 0.033935546875, 0.0550537109375, 0.076171875, 0.0972900390625, 0.118408203125, 0.1395263671875, 0.16064453125, 0.1817626953125, 0.202880859375, 0.2239990234375, 0.2451171875, 0.2662353515625, 0.287353515625, 0.3084716796875, 0.32958984375, 0.3507080078125, 0.371826171875, 0.3929443359375, 0.4140625, 0.4351806640625, 0.456298828125, 0.4774169921875, 0.49853515625, 0.5196533203125, 0.540771484375, 0.5618896484375, 0.5830078125, 0.6041259765625, 0.625244140625, 0.6463623046875, 0.66748046875, 0.6885986328125, 0.709716796875, 0.7308349609375, 0.751953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 6.0, 8.0, 16.0, 20.0, 29.0, 69.0, 121.0, 136.0, 167.0, 144.0, 120.0, 60.0, 52.0, 19.0, 12.0, 11.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.49358558654785, -19.80167579650879, -19.10976791381836, -18.417858123779297, -17.725950241088867, -17.034040451049805, -16.342132568359375, -15.650222778320312, -14.95831298828125, -14.266404151916504, -13.574495315551758, -12.882585525512695, -12.19067668914795, -11.498767852783203, -10.806859016418457, -10.114950180053711, -9.423041343688965, -8.731132507324219, -8.039223670959473, -7.347314357757568, -6.655405044555664, -5.963496208190918, -5.271587371826172, -4.579678058624268, -3.8877692222595215, -3.1958601474761963, -2.503951072692871, -1.812042236328125, -1.1201331615447998, -0.4282240867614746, 0.2636847496032715, 0.9555940628051758, 1.6475028991699219, 2.339411973953247, 3.0313210487365723, 3.7232298851013184, 4.415139198303223, 5.107048034667969, 5.798956871032715, 6.490866184234619, 7.182775020599365, 7.874683856964111, 8.566593170166016, 9.258502006530762, 9.950410842895508, 10.64232063293457, 11.334228515625, 12.026138305664062, 12.718047142028809, 13.409955978393555, 14.1018648147583, 14.793773651123047, 15.48568344116211, 16.177593231201172, 16.8695011138916, 17.561410903930664, 18.253318786621094, 18.945228576660156, 19.637136459350586, 20.32904624938965, 21.020954132080078, 21.71286392211914, 22.404773712158203, 23.096681594848633, 23.788591384887695]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 3.0, 4.0, 16.0, 8.0, 16.0, 23.0, 25.0, 21.0, 18.0, 26.0, 38.0, 31.0, 35.0, 34.0, 35.0, 31.0, 47.0, 43.0, 41.0, 52.0, 42.0, 46.0, 39.0, 34.0, 26.0, 39.0, 31.0, 28.0, 31.0, 25.0, 23.0, 16.0, 9.0, 9.0, 7.0, 9.0, 8.0, 3.0, 4.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.553396224975586, -15.088220596313477, -14.623044967651367, -14.157869338989258, -13.692693710327148, -13.227518081665039, -12.762343406677246, -12.297167778015137, -11.831992149353027, -11.366816520690918, -10.901640892028809, -10.4364652633667, -9.971290588378906, -9.506114959716797, -9.040939331054688, -8.575763702392578, -8.110588073730469, -7.645412445068359, -7.18023681640625, -6.715061664581299, -6.2498860359191895, -5.78471040725708, -5.319535255432129, -4.8543596267700195, -4.38918399810791, -3.924008369445801, -3.4588329792022705, -2.9936575889587402, -2.528481960296631, -2.0633063316345215, -1.5981309413909912, -1.132955551147461, -0.667780876159668, -0.20260536670684814, 0.2625701427459717, 0.7277456521987915, 1.1929211616516113, 1.6580967903137207, 2.123272180557251, 2.5884475708007812, 3.0536231994628906, 3.518798828125, 3.9839742183685303, 4.4491496086120605, 4.91432523727417, 5.379500865936279, 5.8446760177612305, 6.30985164642334, 6.775027275085449, 7.240202903747559, 7.705378532409668, 8.170554161071777, 8.63572883605957, 9.10090446472168, 9.566080093383789, 10.031255722045898, 10.496431350708008, 10.961606979370117, 11.426782608032227, 11.891958236694336, 12.357133865356445, 12.822309494018555, 13.287484169006348, 13.752659797668457, 14.217835426330566]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 8.0, 9.0, 20.0, 34.0, 49.0, 64.0, 137.0, 205.0, 331.0, 639.0, 1040.0, 2258.0, 4523.0, 9081.0, 20066.0, 51971.0, 134535.0, 318247.0, 618199.0, 892942.0, 915797.0, 652851.0, 339516.0, 140571.0, 53363.0, 20456.0, 8722.0, 4109.0, 1982.0, 1059.0, 612.0, 308.0, 210.0, 122.0, 105.0, 41.0, 34.0, 23.0, 16.0, 9.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.830322265625, -1.77490234375, -1.719482421875, -1.6640625, -1.608642578125, -1.55322265625, -1.497802734375, -1.4423828125, -1.386962890625, -1.33154296875, -1.276123046875, -1.220703125, -1.165283203125, -1.10986328125, -1.054443359375, -0.9990234375, -0.943603515625, -0.88818359375, -0.832763671875, -0.77734375, -0.721923828125, -0.66650390625, -0.611083984375, -0.5556640625, -0.500244140625, -0.44482421875, -0.389404296875, -0.333984375, -0.278564453125, -0.22314453125, -0.167724609375, -0.1123046875, -0.056884765625, -0.00146484375, 0.053955078125, 0.109375, 0.164794921875, 0.22021484375, 0.275634765625, 0.3310546875, 0.386474609375, 0.44189453125, 0.497314453125, 0.552734375, 0.608154296875, 0.66357421875, 0.718994140625, 0.7744140625, 0.829833984375, 0.88525390625, 0.940673828125, 0.99609375, 1.051513671875, 1.10693359375, 1.162353515625, 1.2177734375, 1.273193359375, 1.32861328125, 1.384033203125, 1.439453125, 1.494873046875, 1.55029296875, 1.605712890625, 1.6611328125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 17.0, 14.0, 14.0, 22.0, 24.0, 30.0, 39.0, 37.0, 34.0, 50.0, 46.0, 62.0, 49.0, 59.0, 50.0, 55.0, 52.0, 52.0, 43.0, 41.0, 38.0, 32.0, 31.0, 16.0, 17.0, 16.0, 9.0, 9.0, 7.0, 11.0, 4.0, 8.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.956756591796875, -1.87835693359375, -1.799957275390625, -1.7215576171875, -1.643157958984375, -1.56475830078125, -1.486358642578125, -1.407958984375, -1.329559326171875, -1.25115966796875, -1.172760009765625, -1.0943603515625, -1.015960693359375, -0.93756103515625, -0.859161376953125, -0.78076171875, -0.702362060546875, -0.62396240234375, -0.545562744140625, -0.4671630859375, -0.388763427734375, -0.31036376953125, -0.231964111328125, -0.153564453125, -0.075164794921875, 0.00323486328125, 0.081634521484375, 0.1600341796875, 0.238433837890625, 0.31683349609375, 0.395233154296875, 0.4736328125, 0.552032470703125, 0.63043212890625, 0.708831787109375, 0.7872314453125, 0.865631103515625, 0.94403076171875, 1.022430419921875, 1.100830078125, 1.179229736328125, 1.25762939453125, 1.336029052734375, 1.4144287109375, 1.492828369140625, 1.57122802734375, 1.649627685546875, 1.72802734375, 1.806427001953125, 1.88482666015625, 1.963226318359375, 2.0416259765625, 2.120025634765625, 2.19842529296875, 2.276824951171875, 2.355224609375, 2.433624267578125, 2.51202392578125, 2.590423583984375, 2.6688232421875, 2.747222900390625, 2.82562255859375, 2.904022216796875, 2.982421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 10.0, 13.0, 14.0, 20.0, 25.0, 57.0, 97.0, 136.0, 260.0, 436.0, 858.0, 1810.0, 5905.0, 34006.0, 453494.0, 3226659.0, 429389.0, 32116.0, 5644.0, 1726.0, 739.0, 364.0, 184.0, 136.0, 74.0, 33.0, 24.0, 23.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.18511962890625, -4.0069580078125, -3.82879638671875, -3.650634765625, -3.47247314453125, -3.2943115234375, -3.11614990234375, -2.93798828125, -2.75982666015625, -2.5816650390625, -2.40350341796875, -2.225341796875, -2.04718017578125, -1.8690185546875, -1.69085693359375, -1.5126953125, -1.33453369140625, -1.1563720703125, -0.97821044921875, -0.800048828125, -0.62188720703125, -0.4437255859375, -0.26556396484375, -0.08740234375, 0.09075927734375, 0.2689208984375, 0.44708251953125, 0.625244140625, 0.80340576171875, 0.9815673828125, 1.15972900390625, 1.337890625, 1.51605224609375, 1.6942138671875, 1.87237548828125, 2.050537109375, 2.22869873046875, 2.4068603515625, 2.58502197265625, 2.76318359375, 2.94134521484375, 3.1195068359375, 3.29766845703125, 3.475830078125, 3.65399169921875, 3.8321533203125, 4.01031494140625, 4.1884765625, 4.36663818359375, 4.5447998046875, 4.72296142578125, 4.901123046875, 5.07928466796875, 5.2574462890625, 5.43560791015625, 5.61376953125, 5.79193115234375, 5.9700927734375, 6.14825439453125, 6.326416015625, 6.50457763671875, 6.6827392578125, 6.86090087890625, 7.0390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 13.0, 14.0, 20.0, 30.0, 49.0, 67.0, 109.0, 142.0, 200.0, 255.0, 317.0, 410.0, 450.0, 430.0, 372.0, 298.0, 246.0, 174.0, 136.0, 91.0, 85.0, 47.0, 28.0, 33.0, 10.0, 14.0, 14.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.585693359375, -4.44091796875, -4.296142578125, -4.1513671875, -4.006591796875, -3.86181640625, -3.717041015625, -3.572265625, -3.427490234375, -3.28271484375, -3.137939453125, -2.9931640625, -2.848388671875, -2.70361328125, -2.558837890625, -2.4140625, -2.269287109375, -2.12451171875, -1.979736328125, -1.8349609375, -1.690185546875, -1.54541015625, -1.400634765625, -1.255859375, -1.111083984375, -0.96630859375, -0.821533203125, -0.6767578125, -0.531982421875, -0.38720703125, -0.242431640625, -0.09765625, 0.047119140625, 0.19189453125, 0.336669921875, 0.4814453125, 0.626220703125, 0.77099609375, 0.915771484375, 1.060546875, 1.205322265625, 1.35009765625, 1.494873046875, 1.6396484375, 1.784423828125, 1.92919921875, 2.073974609375, 2.21875, 2.363525390625, 2.50830078125, 2.653076171875, 2.7978515625, 2.942626953125, 3.08740234375, 3.232177734375, 3.376953125, 3.521728515625, 3.66650390625, 3.811279296875, 3.9560546875, 4.100830078125, 4.24560546875, 4.390380859375, 4.53515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 16.0, 21.0, 27.0, 42.0, 72.0, 107.0, 139.0, 132.0, 126.0, 99.0, 63.0, 43.0, 40.0, 28.0, 16.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.61034393310547, -47.10532760620117, -45.600311279296875, -44.095298767089844, -42.59028244018555, -41.08526611328125, -39.58024978637695, -38.075233459472656, -36.570220947265625, -35.06520462036133, -33.56018829345703, -32.05517578125, -30.550159454345703, -29.045143127441406, -27.54012680053711, -26.035110473632812, -24.530094146728516, -23.02507781982422, -21.520063400268555, -20.015047073364258, -18.510032653808594, -17.005016326904297, -15.5, -13.99498462677002, -12.489969253540039, -10.984953880310059, -9.479938507080078, -7.974922180175781, -6.469906806945801, -4.96489143371582, -3.4598751068115234, -1.954859733581543, -0.4498481750488281, 1.0551674365997314, 2.560183048248291, 4.06519889831543, 5.57021427154541, 7.075229644775391, 8.580245971679688, 10.085261344909668, 11.590276718139648, 13.095292091369629, 14.60030746459961, 16.105323791503906, 17.610340118408203, 19.115354537963867, 20.620370864868164, 22.125385284423828, 23.630401611328125, 25.135417938232422, 26.640432357788086, 28.145448684692383, 29.650463104248047, 31.155479431152344, 32.66049575805664, 34.16551208496094, 35.67052459716797, 37.175540924072266, 38.68055725097656, 40.185569763183594, 41.69058609008789, 43.19560241699219, 44.700618743896484, 46.20563507080078, 47.71065139770508]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 5.0, 4.0, 6.0, 7.0, 11.0, 13.0, 12.0, 15.0, 23.0, 23.0, 22.0, 28.0, 32.0, 42.0, 31.0, 32.0, 41.0, 43.0, 34.0, 36.0, 31.0, 44.0, 48.0, 35.0, 35.0, 47.0, 30.0, 35.0, 33.0, 28.0, 21.0, 24.0, 19.0, 18.0, 17.0, 14.0, 15.0, 6.0, 7.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-16.908281326293945, -16.39325523376465, -15.878228187561035, -15.363201141357422, -14.848175048828125, -14.333148956298828, -13.818121910095215, -13.303094863891602, -12.788068771362305, -12.273042678833008, -11.758015632629395, -11.242988586425781, -10.727962493896484, -10.212936401367188, -9.697909355163574, -9.182882308959961, -8.667856216430664, -8.152830123901367, -7.637803077697754, -7.122776508331299, -6.607749938964844, -6.092723369598389, -5.577696800231934, -5.0626702308654785, -4.547643661499023, -4.032617092132568, -3.5175905227661133, -3.002563953399658, -2.487537384033203, -1.972510814666748, -1.457484245300293, -0.9424576759338379, -0.42742919921875, 0.08759737014770508, 0.6026239395141602, 1.1176505088806152, 1.6326770782470703, 2.1477036476135254, 2.6627302169799805, 3.1777567863464355, 3.6927833557128906, 4.207809925079346, 4.722836494445801, 5.237863063812256, 5.752889633178711, 6.267916202545166, 6.782942771911621, 7.297969341278076, 7.812995910644531, 8.328022003173828, 8.843049049377441, 9.358076095581055, 9.873102188110352, 10.388128280639648, 10.903155326843262, 11.418182373046875, 11.933208465576172, 12.448234558105469, 12.963261604309082, 13.478288650512695, 13.993314743041992, 14.508340835571289, 15.023367881774902, 15.538394927978516, 16.053421020507812]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 10.0, 12.0, 12.0, 21.0, 20.0, 51.0, 64.0, 100.0, 184.0, 247.0, 551.0, 1071.0, 2371.0, 5723.0, 16302.0, 60108.0, 273446.0, 484918.0, 150535.0, 34789.0, 10506.0, 4015.0, 1705.0, 761.0, 443.0, 216.0, 119.0, 82.0, 50.0, 30.0, 24.0, 17.0, 16.0, 11.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.724609375, -2.6402587890625, -2.555908203125, -2.4715576171875, -2.38720703125, -2.3028564453125, -2.218505859375, -2.1341552734375, -2.0498046875, -1.9654541015625, -1.881103515625, -1.7967529296875, -1.71240234375, -1.6280517578125, -1.543701171875, -1.4593505859375, -1.375, -1.2906494140625, -1.206298828125, -1.1219482421875, -1.03759765625, -0.9532470703125, -0.868896484375, -0.7845458984375, -0.7001953125, -0.6158447265625, -0.531494140625, -0.4471435546875, -0.36279296875, -0.2784423828125, -0.194091796875, -0.1097412109375, -0.025390625, 0.0589599609375, 0.143310546875, 0.2276611328125, 0.31201171875, 0.3963623046875, 0.480712890625, 0.5650634765625, 0.6494140625, 0.7337646484375, 0.818115234375, 0.9024658203125, 0.98681640625, 1.0711669921875, 1.155517578125, 1.2398681640625, 1.32421875, 1.4085693359375, 1.492919921875, 1.5772705078125, 1.66162109375, 1.7459716796875, 1.830322265625, 1.9146728515625, 1.9990234375, 2.0833740234375, 2.167724609375, 2.2520751953125, 2.33642578125, 2.4207763671875, 2.505126953125, 2.5894775390625, 2.673828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 7.0, 8.0, 12.0, 21.0, 25.0, 25.0, 20.0, 40.0, 33.0, 27.0, 42.0, 38.0, 46.0, 60.0, 62.0, 54.0, 47.0, 43.0, 58.0, 46.0, 38.0, 39.0, 31.0, 32.0, 26.0, 19.0, 20.0, 12.0, 18.0, 13.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.125, -3.026214599609375, -2.92742919921875, -2.828643798828125, -2.7298583984375, -2.631072998046875, -2.53228759765625, -2.433502197265625, -2.334716796875, -2.235931396484375, -2.13714599609375, -2.038360595703125, -1.9395751953125, -1.840789794921875, -1.74200439453125, -1.643218994140625, -1.54443359375, -1.445648193359375, -1.34686279296875, -1.248077392578125, -1.1492919921875, -1.050506591796875, -0.95172119140625, -0.852935791015625, -0.754150390625, -0.655364990234375, -0.55657958984375, -0.457794189453125, -0.3590087890625, -0.260223388671875, -0.16143798828125, -0.062652587890625, 0.0361328125, 0.134918212890625, 0.23370361328125, 0.332489013671875, 0.4312744140625, 0.530059814453125, 0.62884521484375, 0.727630615234375, 0.826416015625, 0.925201416015625, 1.02398681640625, 1.122772216796875, 1.2215576171875, 1.320343017578125, 1.41912841796875, 1.517913818359375, 1.61669921875, 1.715484619140625, 1.81427001953125, 1.913055419921875, 2.0118408203125, 2.110626220703125, 2.20941162109375, 2.308197021484375, 2.406982421875, 2.505767822265625, 2.60455322265625, 2.703338623046875, 2.8021240234375, 2.900909423828125, 2.99969482421875, 3.098480224609375, 3.197265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 3.0, 6.0, 12.0, 17.0, 24.0, 15.0, 40.0, 53.0, 79.0, 153.0, 182.0, 308.0, 521.0, 989.0, 1872.0, 3988.0, 9173.0, 24768.0, 84715.0, 434852.0, 364803.0, 80686.0, 24245.0, 8972.0, 3868.0, 1810.0, 987.0, 538.0, 283.0, 194.0, 109.0, 90.0, 55.0, 43.0, 22.0, 24.0, 14.0, 14.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-2.734375, -2.65838623046875, -2.5823974609375, -2.50640869140625, -2.430419921875, -2.35443115234375, -2.2784423828125, -2.20245361328125, -2.12646484375, -2.05047607421875, -1.9744873046875, -1.89849853515625, -1.822509765625, -1.74652099609375, -1.6705322265625, -1.59454345703125, -1.5185546875, -1.44256591796875, -1.3665771484375, -1.29058837890625, -1.214599609375, -1.13861083984375, -1.0626220703125, -0.98663330078125, -0.91064453125, -0.83465576171875, -0.7586669921875, -0.68267822265625, -0.606689453125, -0.53070068359375, -0.4547119140625, -0.37872314453125, -0.302734375, -0.22674560546875, -0.1507568359375, -0.07476806640625, 0.001220703125, 0.07720947265625, 0.1531982421875, 0.22918701171875, 0.30517578125, 0.38116455078125, 0.4571533203125, 0.53314208984375, 0.609130859375, 0.68511962890625, 0.7611083984375, 0.83709716796875, 0.9130859375, 0.98907470703125, 1.0650634765625, 1.14105224609375, 1.217041015625, 1.29302978515625, 1.3690185546875, 1.44500732421875, 1.52099609375, 1.59698486328125, 1.6729736328125, 1.74896240234375, 1.824951171875, 1.90093994140625, 1.9769287109375, 2.05291748046875, 2.12890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 10.0, 9.0, 18.0, 18.0, 21.0, 29.0, 40.0, 37.0, 36.0, 44.0, 42.0, 59.0, 59.0, 68.0, 63.0, 44.0, 49.0, 43.0, 47.0, 47.0, 37.0, 31.0, 30.0, 18.0, 23.0, 14.0, 8.0, 9.0, 8.0, 2.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.5474853515625, -7.305908203125, -7.0643310546875, -6.82275390625, -6.5811767578125, -6.339599609375, -6.0980224609375, -5.8564453125, -5.6148681640625, -5.373291015625, -5.1317138671875, -4.89013671875, -4.6485595703125, -4.406982421875, -4.1654052734375, -3.923828125, -3.6822509765625, -3.440673828125, -3.1990966796875, -2.95751953125, -2.7159423828125, -2.474365234375, -2.2327880859375, -1.9912109375, -1.7496337890625, -1.508056640625, -1.2664794921875, -1.02490234375, -0.7833251953125, -0.541748046875, -0.3001708984375, -0.05859375, 0.1829833984375, 0.424560546875, 0.6661376953125, 0.90771484375, 1.1492919921875, 1.390869140625, 1.6324462890625, 1.8740234375, 2.1156005859375, 2.357177734375, 2.5987548828125, 2.84033203125, 3.0819091796875, 3.323486328125, 3.5650634765625, 3.806640625, 4.0482177734375, 4.289794921875, 4.5313720703125, 4.77294921875, 5.0145263671875, 5.256103515625, 5.4976806640625, 5.7392578125, 5.9808349609375, 6.222412109375, 6.4639892578125, 6.70556640625, 6.9471435546875, 7.188720703125, 7.4302978515625, 7.671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 8.0, 19.0, 18.0, 29.0, 57.0, 65.0, 124.0, 217.0, 421.0, 958.0, 2697.0, 10459.0, 84935.0, 831366.0, 100837.0, 11540.0, 2857.0, 933.0, 425.0, 228.0, 137.0, 75.0, 44.0, 35.0, 21.0, 14.0, 12.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.26708984375, -1.2255859375, -1.18408203125, -1.142578125, -1.10107421875, -1.0595703125, -1.01806640625, -0.9765625, -0.93505859375, -0.8935546875, -0.85205078125, -0.810546875, -0.76904296875, -0.7275390625, -0.68603515625, -0.64453125, -0.60302734375, -0.5615234375, -0.52001953125, -0.478515625, -0.43701171875, -0.3955078125, -0.35400390625, -0.3125, -0.27099609375, -0.2294921875, -0.18798828125, -0.146484375, -0.10498046875, -0.0634765625, -0.02197265625, 0.01953125, 0.06103515625, 0.1025390625, 0.14404296875, 0.185546875, 0.22705078125, 0.2685546875, 0.31005859375, 0.3515625, 0.39306640625, 0.4345703125, 0.47607421875, 0.517578125, 0.55908203125, 0.6005859375, 0.64208984375, 0.68359375, 0.72509765625, 0.7666015625, 0.80810546875, 0.849609375, 0.89111328125, 0.9326171875, 0.97412109375, 1.015625, 1.05712890625, 1.0986328125, 1.14013671875, 1.181640625, 1.22314453125, 1.2646484375, 1.30615234375, 1.34765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 9.0, 8.0, 14.0, 20.0, 28.0, 48.0, 54.0, 71.0, 104.0, 86.0, 120.0, 119.0, 79.0, 53.0, 36.0, 36.0, 20.0, 18.0, 17.0, 11.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023090839385986328, -0.00022430531680583954, -0.0002177022397518158, -0.00021109916269779205, -0.0002044960856437683, -0.00019789300858974457, -0.00019128993153572083, -0.00018468685448169708, -0.00017808377742767334, -0.0001714807003736496, -0.00016487762331962585, -0.0001582745462656021, -0.00015167146921157837, -0.00014506839215755463, -0.00013846531510353088, -0.00013186223804950714, -0.0001252591609954834, -0.00011865608394145966, -0.00011205300688743591, -0.00010544992983341217, -9.884685277938843e-05, -9.224377572536469e-05, -8.564069867134094e-05, -7.90376216173172e-05, -7.243454456329346e-05, -6.583146750926971e-05, -5.922839045524597e-05, -5.262531340122223e-05, -4.6022236347198486e-05, -3.9419159293174744e-05, -3.2816082239151e-05, -2.6213005185127258e-05, -1.9609928131103516e-05, -1.3006851077079773e-05, -6.40377402305603e-06, 1.993030309677124e-07, 6.802380084991455e-06, 1.3405457139015198e-05, 2.000853419303894e-05, 2.6611611247062683e-05, 3.3214688301086426e-05, 3.981776535511017e-05, 4.642084240913391e-05, 5.3023919463157654e-05, 5.9626996517181396e-05, 6.623007357120514e-05, 7.283315062522888e-05, 7.943622767925262e-05, 8.603930473327637e-05, 9.264238178730011e-05, 9.924545884132385e-05, 0.0001058485358953476, 0.00011245161294937134, 0.00011905469000339508, 0.00012565776705741882, 0.00013226084411144257, 0.0001388639211654663, 0.00014546699821949005, 0.0001520700752735138, 0.00015867315232753754, 0.00016527622938156128, 0.00017187930643558502, 0.00017848238348960876, 0.0001850854605436325, 0.00019168853759765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 15.0, 14.0, 15.0, 33.0, 42.0, 58.0, 108.0, 162.0, 273.0, 441.0, 1045.0, 2955.0, 12955.0, 105655.0, 788097.0, 116789.0, 14147.0, 3312.0, 1135.0, 517.0, 268.0, 160.0, 118.0, 73.0, 39.0, 25.0, 27.0, 17.0, 15.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.228515625, -1.1854400634765625, -1.142364501953125, -1.0992889404296875, -1.05621337890625, -1.0131378173828125, -0.970062255859375, -0.9269866943359375, -0.8839111328125, -0.8408355712890625, -0.797760009765625, -0.7546844482421875, -0.71160888671875, -0.6685333251953125, -0.625457763671875, -0.5823822021484375, -0.539306640625, -0.4962310791015625, -0.453155517578125, -0.4100799560546875, -0.36700439453125, -0.3239288330078125, -0.280853271484375, -0.2377777099609375, -0.1947021484375, -0.1516265869140625, -0.108551025390625, -0.0654754638671875, -0.02239990234375, 0.0206756591796875, 0.063751220703125, 0.1068267822265625, 0.14990234375, 0.1929779052734375, 0.236053466796875, 0.2791290283203125, 0.32220458984375, 0.3652801513671875, 0.408355712890625, 0.4514312744140625, 0.4945068359375, 0.5375823974609375, 0.580657958984375, 0.6237335205078125, 0.66680908203125, 0.7098846435546875, 0.752960205078125, 0.7960357666015625, 0.839111328125, 0.8821868896484375, 0.925262451171875, 0.9683380126953125, 1.01141357421875, 1.0544891357421875, 1.097564697265625, 1.1406402587890625, 1.1837158203125, 1.2267913818359375, 1.269866943359375, 1.3129425048828125, 1.35601806640625, 1.3990936279296875, 1.442169189453125, 1.4852447509765625, 1.5283203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 9.0, 9.0, 7.0, 9.0, 10.0, 14.0, 9.0, 14.0, 21.0, 28.0, 24.0, 43.0, 57.0, 66.0, 69.0, 90.0, 74.0, 98.0, 69.0, 51.0, 46.0, 30.0, 23.0, 25.0, 13.0, 8.0, 9.0, 11.0, 11.0, 3.0, 7.0, 6.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.99267578125, -0.9608383178710938, -0.9290008544921875, -0.8971633911132812, -0.865325927734375, -0.8334884643554688, -0.8016510009765625, -0.7698135375976562, -0.73797607421875, -0.7061386108398438, -0.6743011474609375, -0.6424636840820312, -0.610626220703125, -0.5787887573242188, -0.5469512939453125, -0.5151138305664062, -0.4832763671875, -0.45143890380859375, -0.4196014404296875, -0.38776397705078125, -0.355926513671875, -0.32408905029296875, -0.2922515869140625, -0.26041412353515625, -0.22857666015625, -0.19673919677734375, -0.1649017333984375, -0.13306427001953125, -0.101226806640625, -0.06938934326171875, -0.0375518798828125, -0.00571441650390625, 0.026123046875, 0.05796051025390625, 0.0897979736328125, 0.12163543701171875, 0.153472900390625, 0.18531036376953125, 0.2171478271484375, 0.24898529052734375, 0.28082275390625, 0.31266021728515625, 0.3444976806640625, 0.37633514404296875, 0.408172607421875, 0.44001007080078125, 0.4718475341796875, 0.5036849975585938, 0.5355224609375, 0.5673599243164062, 0.5991973876953125, 0.6310348510742188, 0.662872314453125, 0.6947097778320312, 0.7265472412109375, 0.7583847045898438, 0.79022216796875, 0.8220596313476562, 0.8538970947265625, 0.8857345581054688, 0.917572021484375, 0.9494094848632812, 0.9812469482421875, 1.0130844116210938, 1.044921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 16.0, 19.0, 23.0, 56.0, 101.0, 147.0, 209.0, 161.0, 113.0, 62.0, 37.0, 14.0, 16.0, 7.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8845157623291, -20.003063201904297, -19.121610641479492, -18.240158081054688, -17.358705520629883, -16.477252960205078, -15.595800399780273, -14.714347839355469, -13.832895278930664, -12.95144271850586, -12.069990158081055, -11.18853759765625, -10.307085037231445, -9.42563247680664, -8.544179916381836, -7.662727355957031, -6.781274795532227, -5.899822235107422, -5.018369674682617, -4.1369171142578125, -3.255464553833008, -2.374011993408203, -1.4925594329833984, -0.6111068725585938, 0.27034568786621094, 1.1517982482910156, 2.0332508087158203, 2.914703369140625, 3.7961559295654297, 4.677608489990234, 5.559061050415039, 6.440513610839844, 7.321968078613281, 8.203420639038086, 9.08487319946289, 9.966325759887695, 10.8477783203125, 11.729230880737305, 12.61068344116211, 13.492136001586914, 14.373588562011719, 15.255041122436523, 16.136493682861328, 17.017946243286133, 17.899398803710938, 18.780851364135742, 19.662303924560547, 20.54375648498535, 21.425209045410156, 22.30666160583496, 23.188114166259766, 24.06956672668457, 24.951019287109375, 25.83247184753418, 26.713924407958984, 27.59537696838379, 28.476829528808594, 29.3582820892334, 30.239734649658203, 31.121187210083008, 32.00263977050781, 32.88409423828125, 33.76554489135742, 34.646995544433594, 35.52845001220703]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 10.0, 13.0, 18.0, 20.0, 26.0, 29.0, 26.0, 33.0, 35.0, 54.0, 68.0, 82.0, 90.0, 88.0, 52.0, 51.0, 41.0, 46.0, 44.0, 24.0, 33.0, 19.0, 15.0, 13.0, 14.0, 13.0, 9.0, 7.0, 2.0, 1.0, 8.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.42766571044922, -23.746395111083984, -23.06512451171875, -22.383852005004883, -21.70258140563965, -21.021310806274414, -20.34004020690918, -19.658767700195312, -18.977497100830078, -18.296226501464844, -17.61495590209961, -16.933683395385742, -16.252412796020508, -15.571142196655273, -14.889871597290039, -14.208600044250488, -13.527329444885254, -12.84605884552002, -12.164787292480469, -11.483516693115234, -10.802245140075684, -10.12097454071045, -9.439702987670898, -8.758432388305664, -8.07716178894043, -7.395890712738037, -6.7146196365356445, -6.03334903717041, -5.352077484130859, -4.670806884765625, -3.9895358085632324, -3.30826473236084, -2.626993179321289, -1.9457221031188965, -1.2644511461257935, -0.5831801891326904, 0.09809088706970215, 0.7793619632720947, 1.4606328010559082, 2.141903877258301, 2.8231749534606934, 3.504446029663086, 4.1857171058654785, 4.866988182067871, 5.5482587814331055, 6.229530334472656, 6.910800933837891, 7.592072010040283, 8.273343086242676, 8.95461368560791, 9.635885238647461, 10.317155838012695, 10.998427391052246, 11.67969799041748, 12.360969543457031, 13.042240142822266, 13.7235107421875, 14.404781341552734, 15.086052894592285, 15.76732349395752, 16.44859504699707, 17.129865646362305, 17.81113624572754, 18.492408752441406, 19.17367935180664]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 4.0, 6.0, 9.0, 7.0, 12.0, 15.0, 15.0, 15.0, 14.0, 18.0, 24.0, 16.0, 34.0, 41.0, 68.0, 179.0, 199.0, 78.0, 45.0, 31.0, 31.0, 25.0, 22.0, 24.0, 15.0, 12.0, 12.0, 6.0, 3.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.11322021484375, -2.0174560546875, -1.92169189453125, -1.825927734375, -1.73016357421875, -1.6343994140625, -1.53863525390625, -1.44287109375, -1.34710693359375, -1.2513427734375, -1.15557861328125, -1.059814453125, -0.96405029296875, -0.8682861328125, -0.77252197265625, -0.6767578125, -0.58099365234375, -0.4852294921875, -0.38946533203125, -0.293701171875, -0.19793701171875, -0.1021728515625, -0.00640869140625, 0.08935546875, 0.18511962890625, 0.2808837890625, 0.37664794921875, 0.472412109375, 0.56817626953125, 0.6639404296875, 0.75970458984375, 0.85546875, 0.95123291015625, 1.0469970703125, 1.14276123046875, 1.238525390625, 1.33428955078125, 1.4300537109375, 1.52581787109375, 1.62158203125, 1.71734619140625, 1.8131103515625, 1.90887451171875, 2.004638671875, 2.10040283203125, 2.1961669921875, 2.29193115234375, 2.3876953125, 2.48345947265625, 2.5792236328125, 2.67498779296875, 2.770751953125, 2.86651611328125, 2.9622802734375, 3.05804443359375, 3.15380859375, 3.24957275390625, 3.3453369140625, 3.44110107421875, 3.536865234375, 3.63262939453125, 3.7283935546875, 3.82415771484375, 3.919921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 8.0, 7.0, 4.0, 9.0, 6.0, 16.0, 21.0, 30.0, 62.0, 62.0, 121.0, 188.0, 290.0, 556.0, 1105.0, 2347.0, 5733.0, 18648.0, 7712430.0, 621108.0, 15993.0, 5171.0, 2158.0, 1051.0, 562.0, 297.0, 197.0, 128.0, 71.0, 50.0, 44.0, 30.0, 23.0, 13.0, 12.0, 7.0, 11.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-9.680540084838867, -9.425344467163086, -9.170148849487305, -8.91495418548584, -8.659758567810059, -8.404562950134277, -8.149367332458496, -7.894171714782715, -7.638976573944092, -7.3837809562683105, -7.1285858154296875, -6.873390197753906, -6.618194580078125, -6.362999439239502, -6.107803821563721, -5.852608680725098, -5.597413063049316, -5.342217445373535, -5.087022304534912, -4.831826686859131, -4.576631546020508, -4.321435928344727, -4.066240310668945, -3.811044931411743, -3.555849552154541, -3.300654172897339, -3.0454587936401367, -2.7902631759643555, -2.5350677967071533, -2.279872417449951, -2.02467679977417, -1.7694814205169678, -1.5142860412597656, -1.2590906620025635, -1.0038951635360718, -0.7486997246742249, -0.49350428581237793, -0.23830890655517578, 0.016886591911315918, 0.2720820903778076, 0.5272774696350098, 0.7824729084968567, 1.0376683473587036, 1.2928638458251953, 1.5480592250823975, 1.8032546043395996, 2.058450222015381, 2.313645601272583, 2.568840980529785, 2.8240363597869873, 3.0792317390441895, 3.3344273567199707, 3.589622735977173, 3.844818115234375, 4.100013732910156, 4.3552093505859375, 4.6104044914245605, 4.865600109100342, 5.120795249938965, 5.375990867614746, 5.631186485290527, 5.88638162612915, 6.141577243804932, 6.396772384643555, 6.651968002319336]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 3.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 3.0, 0.0, 6.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.560235977172852, -13.227935791015625, -12.895635604858398, -12.563334465026855, -12.231034278869629, -11.898734092712402, -11.56643295288086, -11.234132766723633, -10.901832580566406, -10.56953239440918, -10.237232208251953, -9.90493106842041, -9.572630882263184, -9.240330696105957, -8.908029556274414, -8.575729370117188, -8.243429183959961, -7.911128997802734, -7.57882833480835, -7.246527671813965, -6.914227485656738, -6.581927299499512, -6.249626636505127, -5.917325973510742, -5.585025787353516, -5.252725601196289, -4.920424938201904, -4.5881242752075195, -4.255824089050293, -3.9235236644744873, -3.5912232398986816, -3.258922815322876, -2.9266233444213867, -2.594322919845581, -2.2620224952697754, -1.9297220706939697, -1.597421646118164, -1.2651212215423584, -0.9328207969665527, -0.6005203723907471, -0.2682199478149414, 0.06408047676086426, 0.3963809013366699, 0.7286813259124756, 1.0609817504882812, 1.393282175064087, 1.7255825996398926, 2.0578830242156982, 2.390183448791504, 2.7224838733673096, 3.0547842979431152, 3.387084722518921, 3.7193851470947266, 4.051685333251953, 4.383985996246338, 4.716286659240723, 5.048586845397949, 5.380887031555176, 5.7131876945495605, 6.045488357543945, 6.377788543701172, 6.710088729858398, 7.042389392852783, 7.374690055847168, 7.7069902420043945]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 14.0, 9.0, 17.0, 22.0, 21.0, 36.0, 49.0, 38.0, 40.0, 50.0, 54.0, 62.0, 67.0, 50.0, 68.0, 43.0, 54.0, 49.0, 41.0, 42.0, 31.0, 28.0, 20.0, 20.0, 13.0, 11.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6775970458984375, -1.615936279296875, -1.5542755126953125, -1.49261474609375, -1.4309539794921875, -1.369293212890625, -1.3076324462890625, -1.2459716796875, -1.1843109130859375, -1.122650146484375, -1.0609893798828125, -0.99932861328125, -0.9376678466796875, -0.876007080078125, -0.8143463134765625, -0.752685546875, -0.6910247802734375, -0.629364013671875, -0.5677032470703125, -0.50604248046875, -0.4443817138671875, -0.382720947265625, -0.3210601806640625, -0.2593994140625, -0.1977386474609375, -0.136077880859375, -0.0744171142578125, -0.01275634765625, 0.0489044189453125, 0.110565185546875, 0.1722259521484375, 0.23388671875, 0.2955474853515625, 0.357208251953125, 0.4188690185546875, 0.48052978515625, 0.5421905517578125, 0.603851318359375, 0.6655120849609375, 0.7271728515625, 0.7888336181640625, 0.850494384765625, 0.9121551513671875, 0.97381591796875, 1.0354766845703125, 1.097137451171875, 1.1587982177734375, 1.220458984375, 1.2821197509765625, 1.343780517578125, 1.4054412841796875, 1.46710205078125, 1.5287628173828125, 1.590423583984375, 1.6520843505859375, 1.7137451171875, 1.7754058837890625, 1.837066650390625, 1.8987274169921875, 1.96038818359375, 2.0220489501953125, 2.083709716796875, 2.1453704833984375, 2.20703125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 15.0, 16.0, 29.0, 37.0, 38.0, 54.0, 86.0, 111.0, 167.0, 237.0, 386.0, 562.0, 900.0, 1435.0, 2421.0, 4320.0, 8164.0, 16082.0, 37164.0, 108040.0, 194094.0, 86599.0, 31541.0, 14412.0, 7271.0, 4041.0, 2272.0, 1291.0, 792.0, 524.0, 330.0, 243.0, 169.0, 113.0, 77.0, 62.0, 36.0, 25.0, 19.0, 17.0, 13.0, 11.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.5, -23.719970703125, -22.93994140625, -22.159912109375, -21.3798828125, -20.599853515625, -19.81982421875, -19.039794921875, -18.259765625, -17.479736328125, -16.69970703125, -15.919677734375, -15.1396484375, -14.359619140625, -13.57958984375, -12.799560546875, -12.01953125, -11.239501953125, -10.45947265625, -9.679443359375, -8.8994140625, -8.119384765625, -7.33935546875, -6.559326171875, -5.779296875, -4.999267578125, -4.21923828125, -3.439208984375, -2.6591796875, -1.879150390625, -1.09912109375, -0.319091796875, 0.4609375, 1.240966796875, 2.02099609375, 2.801025390625, 3.5810546875, 4.361083984375, 5.14111328125, 5.921142578125, 6.701171875, 7.481201171875, 8.26123046875, 9.041259765625, 9.8212890625, 10.601318359375, 11.38134765625, 12.161376953125, 12.94140625, 13.721435546875, 14.50146484375, 15.281494140625, 16.0615234375, 16.841552734375, 17.62158203125, 18.401611328125, 19.181640625, 19.961669921875, 20.74169921875, 21.521728515625, 22.3017578125, 23.081787109375, 23.86181640625, 24.641845703125, 25.421875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 4.0, 7.0, 14.0, 19.0, 17.0, 21.0, 35.0, 28.0, 42.0, 37.0, 37.0, 50.0, 35.0, 58.0, 52.0, 49.0, 50.0, 46.0, 45.0, 50.0, 42.0, 50.0, 24.0, 31.0, 32.0, 18.0, 17.0, 10.0, 6.0, 16.0, 11.0, 6.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.431640625, -2.346435546875, -2.26123046875, -2.176025390625, -2.0908203125, -2.005615234375, -1.92041015625, -1.835205078125, -1.75, -1.664794921875, -1.57958984375, -1.494384765625, -1.4091796875, -1.323974609375, -1.23876953125, -1.153564453125, -1.068359375, -0.983154296875, -0.89794921875, -0.812744140625, -0.7275390625, -0.642333984375, -0.55712890625, -0.471923828125, -0.38671875, -0.301513671875, -0.21630859375, -0.131103515625, -0.0458984375, 0.039306640625, 0.12451171875, 0.209716796875, 0.294921875, 0.380126953125, 0.46533203125, 0.550537109375, 0.6357421875, 0.720947265625, 0.80615234375, 0.891357421875, 0.9765625, 1.061767578125, 1.14697265625, 1.232177734375, 1.3173828125, 1.402587890625, 1.48779296875, 1.572998046875, 1.658203125, 1.743408203125, 1.82861328125, 1.913818359375, 1.9990234375, 2.084228515625, 2.16943359375, 2.254638671875, 2.33984375, 2.425048828125, 2.51025390625, 2.595458984375, 2.6806640625, 2.765869140625, 2.85107421875, 2.936279296875, 3.021484375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 12.0, 5.0, 30.0, 39.0, 55.0, 73.0, 79.0, 64.0, 32.0, 25.0, 12.0, 8.0, 10.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.080479621887207, -10.668635368347168, -10.256791114807129, -9.84494686126709, -9.433103561401367, -9.021259307861328, -8.609415054321289, -8.19757080078125, -7.785726547241211, -7.373882293701172, -6.962038040161133, -6.550194263458252, -6.138350009918213, -5.726505756378174, -5.314661979675293, -4.902817726135254, -4.490973472595215, -4.079129219055176, -3.667285203933716, -3.255441188812256, -2.843596935272217, -2.4317526817321777, -2.0199086666107178, -1.6080646514892578, -1.1962203979492188, -0.7843762636184692, -0.3725321292877197, 0.039312005043029785, 0.4511561393737793, 0.8630003929138184, 1.2748444080352783, 1.6866884231567383, 2.098531723022461, 2.5103759765625, 2.92221999168396, 3.33406400680542, 3.745908260345459, 4.157752513885498, 4.569596290588379, 4.981440544128418, 5.393284797668457, 5.805129051208496, 6.216973304748535, 6.628817081451416, 7.040661334991455, 7.452505588531494, 7.864349365234375, 8.276193618774414, 8.688037872314453, 9.099882125854492, 9.511726379394531, 9.92357063293457, 10.33541488647461, 10.747259140014648, 11.159102439880371, 11.57094669342041, 11.98279094696045, 12.394635200500488, 12.806479454040527, 13.218323707580566, 13.630167007446289, 14.042011260986328, 14.453855514526367, 14.865699768066406, 15.277544021606445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 9.0, 9.0, 11.0, 13.0, 12.0, 22.0, 40.0, 91.0, 116.0, 35.0, 21.0, 16.0, 10.0, 7.0, 14.0, 11.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.910449981689453, -11.47547721862793, -11.040504455566406, -10.605531692504883, -10.17055892944336, -9.735586166381836, -9.300613403320312, -8.865640640258789, -8.430667877197266, -7.995695114135742, -7.560722351074219, -7.125749588012695, -6.690776824951172, -6.255804061889648, -5.820830821990967, -5.385858058929443, -4.950884819030762, -4.515912055969238, -4.080939292907715, -3.6459662914276123, -3.210993528366089, -2.7760207653045654, -2.341047763824463, -1.9060750007629395, -1.471102237701416, -1.0361294746398926, -0.6011565923690796, -0.1661837100982666, 0.26878905296325684, 0.7037618160247803, 1.1387348175048828, 1.5737075805664062, 2.0086793899536133, 2.4436521530151367, 2.87862491607666, 3.3135979175567627, 3.748570680618286, 4.1835432052612305, 4.618516445159912, 5.0534892082214355, 5.488461971282959, 5.923434734344482, 6.358407497406006, 6.7933807373046875, 7.228353500366211, 7.663326263427734, 8.098299026489258, 8.533271789550781, 8.968244552612305, 9.403217315673828, 9.838190078735352, 10.273162841796875, 10.708135604858398, 11.143108367919922, 11.578081130981445, 12.013053894042969, 12.448026657104492, 12.882999420166016, 13.317972183227539, 13.752944946289062, 14.187917709350586, 14.62289047241211, 15.057863235473633, 15.492835998535156, 15.927809715270996]}, "eval/loss": 1.642454743385315, "eval/bleu": 2.691896075803751e-15, "eval/runtime": 2632.4174, "eval/samples_per_second": 5.607, "eval/steps_per_second": 0.701, "train/train_runtime": 95217.2299, "train/train_samples_per_second": 6.534, "train/train_steps_per_second": 0.102, "train/total_flos": 0.0, "train/train_loss": 1.7970677693255643} \ No newline at end of file +{"train/loss": 0.4724, "train/learning_rate": 1.0702900088061256e-07, "train/epoch": 3.0, "train/global_step": 9720, "_runtime": 95217, "_timestamp": 1651769306, "_step": 9739, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 16.0, 47.0, 105.0, 194.0, 255.0, 200.0, 126.0, 40.0, 24.0, 5.0], "bins": [-38.22578811645508, -37.57297134399414, -36.9201545715332, -36.267337799072266, -35.61452102661133, -34.961700439453125, -34.30888366699219, -33.65606689453125, -33.00325012207031, -32.350433349609375, -31.697616577148438, -31.044797897338867, -30.39198112487793, -29.739164352416992, -29.086347579956055, -28.433530807495117, -27.78071403503418, -27.127897262573242, -26.475080490112305, -25.822261810302734, -25.169445037841797, -24.51662826538086, -23.863811492919922, -23.210994720458984, -22.558177947998047, -21.90536117553711, -21.252544403076172, -20.5997257232666, -19.946908950805664, -19.294092178344727, -18.64127540588379, -17.98845863342285, -17.33563804626465, -16.68282127380371, -16.030004501342773, -15.37718677520752, -14.724369049072266, -14.071552276611328, -13.41873550415039, -12.765918731689453, -12.1131010055542, -11.460284233093262, -10.807466506958008, -10.15464973449707, -9.501832962036133, -8.849015235900879, -8.196198463439941, -7.543381214141846, -6.89056396484375, -6.237746715545654, -5.584929466247559, -4.932112693786621, -4.279295444488525, -3.6264781951904297, -2.973661184310913, -2.3208441734313965, -1.6680269241333008, -1.0152097940444946, -0.3623926639556885, 0.2904244661331177, 0.9432415962219238, 1.5960588455200195, 2.248875856399536, 2.9016928672790527, 3.5545101165771484]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 8.0, 10.0, 14.0, 12.0, 17.0, 19.0, 16.0, 30.0, 19.0, 19.0, 31.0, 38.0, 32.0, 37.0, 53.0, 43.0, 41.0, 36.0, 33.0, 34.0, 23.0, 42.0, 37.0, 39.0, 41.0, 31.0, 31.0, 25.0, 25.0, 24.0, 22.0, 15.0, 19.0, 16.0, 4.0, 10.0, 12.0, 5.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76909065246582, -5.58101749420166, -5.3929443359375, -5.204871654510498, -5.016798496246338, -4.828725337982178, -4.640652179718018, -4.452579498291016, -4.2645063400268555, -4.076433181762695, -3.8883602619171143, -3.700287103652954, -3.512214183807373, -3.324141025543213, -3.1360678672790527, -2.9479949474334717, -2.7599217891693115, -2.5718486309051514, -2.3837757110595703, -2.19570255279541, -2.007629632949829, -1.819556474685669, -1.6314834356307983, -1.4434103965759277, -1.2553373575210571, -1.0672643184661865, -0.8791912794113159, -0.6911181807518005, -0.5030451416969299, -0.3149721026420593, -0.12689900398254395, 0.06117403507232666, 0.24924707412719727, 0.43732011318206787, 0.6253931522369385, 0.8134662508964539, 1.0015392303466797, 1.1896123886108398, 1.3776854276657104, 1.565758466720581, 1.7538315057754517, 1.9419045448303223, 2.1299777030944824, 2.3180506229400635, 2.5061237812042236, 2.6941967010498047, 2.882269859313965, 3.070343017578125, 3.258415937423706, 3.446489095687866, 3.6345620155334473, 3.8226351737976074, 4.010708332061768, 4.1987810134887695, 4.38685417175293, 4.57492733001709, 4.76300048828125, 4.95107364654541, 5.13914680480957, 5.327219486236572, 5.515292644500732, 5.703365802764893, 5.891438961029053, 6.079511642456055, 6.267584800720215]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 8.0, 9.0, 17.0, 18.0, 18.0, 31.0, 47.0, 70.0, 99.0, 157.0, 276.0, 414.0, 723.0, 1148.0, 2051.0, 3603.0, 6965.0, 14656.0, 34925.0, 106300.0, 379896.0, 1294548.0, 1630173.0, 498712.0, 140514.0, 43605.0, 17353.0, 8163.0, 4141.0, 2187.0, 1342.0, 825.0, 437.0, 297.0, 172.0, 125.0, 59.0, 62.0, 25.0, 33.0, 19.0, 16.0, 14.0, 8.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.5, -11.141845703125, -10.78369140625, -10.425537109375, -10.0673828125, -9.709228515625, -9.35107421875, -8.992919921875, -8.634765625, -8.276611328125, -7.91845703125, -7.560302734375, -7.2021484375, -6.843994140625, -6.48583984375, -6.127685546875, -5.76953125, -5.411376953125, -5.05322265625, -4.695068359375, -4.3369140625, -3.978759765625, -3.62060546875, -3.262451171875, -2.904296875, -2.546142578125, -2.18798828125, -1.829833984375, -1.4716796875, -1.113525390625, -0.75537109375, -0.397216796875, -0.0390625, 0.319091796875, 0.67724609375, 1.035400390625, 1.3935546875, 1.751708984375, 2.10986328125, 2.468017578125, 2.826171875, 3.184326171875, 3.54248046875, 3.900634765625, 4.2587890625, 4.616943359375, 4.97509765625, 5.333251953125, 5.69140625, 6.049560546875, 6.40771484375, 6.765869140625, 7.1240234375, 7.482177734375, 7.84033203125, 8.198486328125, 8.556640625, 8.914794921875, 9.27294921875, 9.631103515625, 9.9892578125, 10.347412109375, 10.70556640625, 11.063720703125, 11.421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 6.0, 4.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 23.0, 12.0, 12.0, 32.0, 24.0, 16.0, 18.0, 32.0, 21.0, 33.0, 36.0, 34.0, 43.0, 37.0, 40.0, 36.0, 29.0, 42.0, 41.0, 30.0, 34.0, 30.0, 36.0, 31.0, 20.0, 28.0, 22.0, 28.0, 12.0, 18.0, 17.0, 11.0, 12.0, 13.0, 9.0, 12.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-8.90625, -8.6258544921875, -8.345458984375, -8.0650634765625, -7.78466796875, -7.5042724609375, -7.223876953125, -6.9434814453125, -6.6630859375, -6.3826904296875, -6.102294921875, -5.8218994140625, -5.54150390625, -5.2611083984375, -4.980712890625, -4.7003173828125, -4.419921875, -4.1395263671875, -3.859130859375, -3.5787353515625, -3.29833984375, -3.0179443359375, -2.737548828125, -2.4571533203125, -2.1767578125, -1.8963623046875, -1.615966796875, -1.3355712890625, -1.05517578125, -0.7747802734375, -0.494384765625, -0.2139892578125, 0.06640625, 0.3468017578125, 0.627197265625, 0.9075927734375, 1.18798828125, 1.4683837890625, 1.748779296875, 2.0291748046875, 2.3095703125, 2.5899658203125, 2.870361328125, 3.1507568359375, 3.43115234375, 3.7115478515625, 3.991943359375, 4.2723388671875, 4.552734375, 4.8331298828125, 5.113525390625, 5.3939208984375, 5.67431640625, 5.9547119140625, 6.235107421875, 6.5155029296875, 6.7958984375, 7.0762939453125, 7.356689453125, 7.6370849609375, 7.91748046875, 8.1978759765625, 8.478271484375, 8.7586669921875, 9.0390625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 18.0, 23.0, 48.0, 42.0, 73.0, 99.0, 137.0, 238.0, 620.0, 18574.0, 4170474.0, 2838.0, 468.0, 214.0, 125.0, 79.0, 69.0, 34.0, 21.0, 14.0, 10.0, 6.0, 8.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-117.5, -113.3515625, -109.203125, -105.0546875, -100.90625, -96.7578125, -92.609375, -88.4609375, -84.3125, -80.1640625, -76.015625, -71.8671875, -67.71875, -63.5703125, -59.421875, -55.2734375, -51.125, -46.9765625, -42.828125, -38.6796875, -34.53125, -30.3828125, -26.234375, -22.0859375, -17.9375, -13.7890625, -9.640625, -5.4921875, -1.34375, 2.8046875, 6.953125, 11.1015625, 15.25, 19.3984375, 23.546875, 27.6953125, 31.84375, 35.9921875, 40.140625, 44.2890625, 48.4375, 52.5859375, 56.734375, 60.8828125, 65.03125, 69.1796875, 73.328125, 77.4765625, 81.625, 85.7734375, 89.921875, 94.0703125, 98.21875, 102.3671875, 106.515625, 110.6640625, 114.8125, 118.9609375, 123.109375, 127.2578125, 131.40625, 135.5546875, 139.703125, 143.8515625, 148.0]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 19.0, 16.0, 24.0, 36.0, 45.0, 55.0, 84.0, 113.0, 144.0, 234.0, 412.0, 850.0, 769.0, 452.0, 251.0, 163.0, 112.0, 80.0, 45.0, 39.0, 34.0, 21.0, 8.0, 11.0, 2.0, 6.0, 6.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.49609375, -4.341064453125, -4.18603515625, -4.031005859375, -3.8759765625, -3.720947265625, -3.56591796875, -3.410888671875, -3.255859375, -3.100830078125, -2.94580078125, -2.790771484375, -2.6357421875, -2.480712890625, -2.32568359375, -2.170654296875, -2.015625, -1.860595703125, -1.70556640625, -1.550537109375, -1.3955078125, -1.240478515625, -1.08544921875, -0.930419921875, -0.775390625, -0.620361328125, -0.46533203125, -0.310302734375, -0.1552734375, -0.000244140625, 0.15478515625, 0.309814453125, 0.46484375, 0.619873046875, 0.77490234375, 0.929931640625, 1.0849609375, 1.239990234375, 1.39501953125, 1.550048828125, 1.705078125, 1.860107421875, 2.01513671875, 2.170166015625, 2.3251953125, 2.480224609375, 2.63525390625, 2.790283203125, 2.9453125, 3.100341796875, 3.25537109375, 3.410400390625, 3.5654296875, 3.720458984375, 3.87548828125, 4.030517578125, 4.185546875, 4.340576171875, 4.49560546875, 4.650634765625, 4.8056640625, 4.960693359375, 5.11572265625, 5.270751953125, 5.42578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 5.0, 8.0, 7.0, 11.0, 15.0, 19.0, 28.0, 28.0, 27.0, 29.0, 45.0, 48.0, 52.0, 56.0, 53.0, 63.0, 54.0, 62.0, 66.0, 53.0, 46.0, 48.0, 30.0, 35.0, 24.0, 17.0, 16.0, 10.0, 12.0, 5.0, 10.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.173274040222168, -13.798551559448242, -13.423830032348633, -13.049107551574707, -12.674386024475098, -12.299663543701172, -11.924942016601562, -11.550219535827637, -11.175497055053711, -10.800774574279785, -10.426053047180176, -10.05133056640625, -9.67660903930664, -9.301886558532715, -8.927164077758789, -8.55244255065918, -8.17772102355957, -7.802999019622803, -7.428277015686035, -7.053554534912109, -6.6788330078125, -6.304110527038574, -5.929388523101807, -5.554666519165039, -5.1799445152282715, -4.805222511291504, -4.430500507354736, -4.055778503417969, -3.681056261062622, -3.3063342571258545, -2.931612014770508, -2.5568900108337402, -2.1821680068969727, -1.807446002960205, -1.432723879814148, -1.0580017566680908, -0.6832797527313232, -0.30855774879455566, 0.06616449356079102, 0.4408864974975586, 0.8156085014343262, 1.1903305053710938, 1.5650526285171509, 1.939774751663208, 2.3144967555999756, 2.689218759536743, 3.06394100189209, 3.4386630058288574, 3.813385009765625, 4.188107013702393, 4.56282901763916, 4.937551498413086, 5.312273025512695, 5.686995506286621, 6.061717510223389, 6.436439514160156, 6.811161518096924, 7.185883522033691, 7.560605525970459, 7.935327529907227, 8.310050010681152, 8.684771537780762, 9.059494018554688, 9.434215545654297, 9.808938026428223]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 6.0, 10.0, 16.0, 13.0, 16.0, 18.0, 35.0, 27.0, 28.0, 35.0, 31.0, 35.0, 43.0, 48.0, 45.0, 43.0, 31.0, 52.0, 41.0, 26.0, 42.0, 35.0, 46.0, 31.0, 42.0, 28.0, 33.0, 17.0, 16.0, 15.0, 19.0, 14.0, 8.0, 9.0, 5.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.746149063110352, -9.437788009643555, -9.129427909851074, -8.821066856384277, -8.512706756591797, -8.204345703125, -7.895984649658203, -7.5876240730285645, -7.279263496398926, -6.970902919769287, -6.662542343139648, -6.354181289672852, -6.045820713043213, -5.737460136413574, -5.429099082946777, -5.120738506317139, -4.8123779296875, -4.504017353057861, -4.195656776428223, -3.887295722961426, -3.578935146331787, -3.2705745697021484, -2.9622137546539307, -2.653852939605713, -2.345492362976074, -2.0371317863464355, -1.7287709712982178, -1.4204102754592896, -1.1120495796203613, -0.8036888837814331, -0.4953281879425049, -0.1869673728942871, 0.12139415740966797, 0.4297548532485962, 0.7381155490875244, 1.0464762449264526, 1.3548369407653809, 1.663197636604309, 1.9715583324432373, 2.279919147491455, 2.5882797241210938, 2.8966403007507324, 3.20500111579895, 3.513361930847168, 3.8217225074768066, 4.130083084106445, 4.438444137573242, 4.746804714202881, 5.0551652908325195, 5.363525867462158, 5.671886444091797, 5.980247497558594, 6.288608074188232, 6.596968650817871, 6.905329704284668, 7.213690280914307, 7.522050857543945, 7.830411434173584, 8.138772010803223, 8.44713306427002, 8.7554931640625, 9.063854217529297, 9.372215270996094, 9.68057632446289, 9.988936424255371]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 13.0, 10.0, 17.0, 34.0, 48.0, 69.0, 69.0, 109.0, 173.0, 272.0, 424.0, 607.0, 862.0, 1416.0, 2363.0, 3829.0, 6094.0, 10338.0, 17723.0, 31559.0, 56514.0, 101473.0, 170361.0, 219748.0, 177480.0, 106740.0, 60252.0, 33143.0, 18789.0, 10940.0, 6493.0, 3832.0, 2358.0, 1513.0, 958.0, 587.0, 442.0, 289.0, 194.0, 126.0, 100.0, 49.0, 37.0, 34.0, 18.0, 15.0, 14.0, 4.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.71875, -2.632568359375, -2.54638671875, -2.460205078125, -2.3740234375, -2.287841796875, -2.20166015625, -2.115478515625, -2.029296875, -1.943115234375, -1.85693359375, -1.770751953125, -1.6845703125, -1.598388671875, -1.51220703125, -1.426025390625, -1.33984375, -1.253662109375, -1.16748046875, -1.081298828125, -0.9951171875, -0.908935546875, -0.82275390625, -0.736572265625, -0.650390625, -0.564208984375, -0.47802734375, -0.391845703125, -0.3056640625, -0.219482421875, -0.13330078125, -0.047119140625, 0.0390625, 0.125244140625, 0.21142578125, 0.297607421875, 0.3837890625, 0.469970703125, 0.55615234375, 0.642333984375, 0.728515625, 0.814697265625, 0.90087890625, 0.987060546875, 1.0732421875, 1.159423828125, 1.24560546875, 1.331787109375, 1.41796875, 1.504150390625, 1.59033203125, 1.676513671875, 1.7626953125, 1.848876953125, 1.93505859375, 2.021240234375, 2.107421875, 2.193603515625, 2.27978515625, 2.365966796875, 2.4521484375, 2.538330078125, 2.62451171875, 2.710693359375, 2.796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 5.0, 6.0, 6.0, 9.0, 8.0, 9.0, 15.0, 18.0, 17.0, 24.0, 28.0, 27.0, 33.0, 29.0, 43.0, 38.0, 46.0, 46.0, 40.0, 49.0, 52.0, 34.0, 41.0, 53.0, 38.0, 34.0, 29.0, 34.0, 27.0, 26.0, 26.0, 14.0, 21.0, 22.0, 14.0, 8.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1953125, -7.952880859375, -7.71044921875, -7.468017578125, -7.2255859375, -6.983154296875, -6.74072265625, -6.498291015625, -6.255859375, -6.013427734375, -5.77099609375, -5.528564453125, -5.2861328125, -5.043701171875, -4.80126953125, -4.558837890625, -4.31640625, -4.073974609375, -3.83154296875, -3.589111328125, -3.3466796875, -3.104248046875, -2.86181640625, -2.619384765625, -2.376953125, -2.134521484375, -1.89208984375, -1.649658203125, -1.4072265625, -1.164794921875, -0.92236328125, -0.679931640625, -0.4375, -0.195068359375, 0.04736328125, 0.289794921875, 0.5322265625, 0.774658203125, 1.01708984375, 1.259521484375, 1.501953125, 1.744384765625, 1.98681640625, 2.229248046875, 2.4716796875, 2.714111328125, 2.95654296875, 3.198974609375, 3.44140625, 3.683837890625, 3.92626953125, 4.168701171875, 4.4111328125, 4.653564453125, 4.89599609375, 5.138427734375, 5.380859375, 5.623291015625, 5.86572265625, 6.108154296875, 6.3505859375, 6.593017578125, 6.83544921875, 7.077880859375, 7.3203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 3.0, 3.0, 0.0, 8.0, 6.0, 14.0, 15.0, 17.0, 35.0, 50.0, 62.0, 113.0, 156.0, 259.0, 506.0, 958.0, 2030.0, 5022.0, 13933.0, 46541.0, 185909.0, 478767.0, 230140.0, 56987.0, 16715.0, 5674.0, 2267.0, 1052.0, 530.0, 281.0, 183.0, 103.0, 75.0, 49.0, 22.0, 14.0, 19.0, 8.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.91015625, -4.744140625, -4.578125, -4.412109375, -4.24609375, -4.080078125, -3.9140625, -3.748046875, -3.58203125, -3.416015625, -3.25, -3.083984375, -2.91796875, -2.751953125, -2.5859375, -2.419921875, -2.25390625, -2.087890625, -1.921875, -1.755859375, -1.58984375, -1.423828125, -1.2578125, -1.091796875, -0.92578125, -0.759765625, -0.59375, -0.427734375, -0.26171875, -0.095703125, 0.0703125, 0.236328125, 0.40234375, 0.568359375, 0.734375, 0.900390625, 1.06640625, 1.232421875, 1.3984375, 1.564453125, 1.73046875, 1.896484375, 2.0625, 2.228515625, 2.39453125, 2.560546875, 2.7265625, 2.892578125, 3.05859375, 3.224609375, 3.390625, 3.556640625, 3.72265625, 3.888671875, 4.0546875, 4.220703125, 4.38671875, 4.552734375, 4.71875, 4.884765625, 5.05078125, 5.216796875, 5.3828125, 5.548828125, 5.71484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 10.0, 19.0, 11.0, 26.0, 16.0, 28.0, 19.0, 22.0, 34.0, 28.0, 27.0, 40.0, 59.0, 35.0, 36.0, 39.0, 42.0, 40.0, 51.0, 47.0, 34.0, 36.0, 34.0, 14.0, 23.0, 26.0, 19.0, 14.0, 19.0, 18.0, 14.0, 14.0, 13.0, 9.0, 7.0, 8.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.4140625, -13.9561767578125, -13.498291015625, -13.0404052734375, -12.58251953125, -12.1246337890625, -11.666748046875, -11.2088623046875, -10.7509765625, -10.2930908203125, -9.835205078125, -9.3773193359375, -8.91943359375, -8.4615478515625, -8.003662109375, -7.5457763671875, -7.087890625, -6.6300048828125, -6.172119140625, -5.7142333984375, -5.25634765625, -4.7984619140625, -4.340576171875, -3.8826904296875, -3.4248046875, -2.9669189453125, -2.509033203125, -2.0511474609375, -1.59326171875, -1.1353759765625, -0.677490234375, -0.2196044921875, 0.23828125, 0.6961669921875, 1.154052734375, 1.6119384765625, 2.06982421875, 2.5277099609375, 2.985595703125, 3.4434814453125, 3.9013671875, 4.3592529296875, 4.817138671875, 5.2750244140625, 5.73291015625, 6.1907958984375, 6.648681640625, 7.1065673828125, 7.564453125, 8.0223388671875, 8.480224609375, 8.9381103515625, 9.39599609375, 9.8538818359375, 10.311767578125, 10.7696533203125, 11.2275390625, 11.6854248046875, 12.143310546875, 12.6011962890625, 13.05908203125, 13.5169677734375, 13.974853515625, 14.4327392578125, 14.890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 8.0, 7.0, 18.0, 21.0, 34.0, 38.0, 59.0, 102.0, 144.0, 243.0, 362.0, 614.0, 1024.0, 1783.0, 3681.0, 8376.0, 24262.0, 121422.0, 673662.0, 164770.0, 29275.0, 9639.0, 4108.0, 2035.0, 1062.0, 647.0, 396.0, 249.0, 158.0, 97.0, 69.0, 46.0, 37.0, 29.0, 20.0, 20.0, 7.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.296875, -3.18902587890625, -3.0811767578125, -2.97332763671875, -2.865478515625, -2.75762939453125, -2.6497802734375, -2.54193115234375, -2.43408203125, -2.32623291015625, -2.2183837890625, -2.11053466796875, -2.002685546875, -1.89483642578125, -1.7869873046875, -1.67913818359375, -1.5712890625, -1.46343994140625, -1.3555908203125, -1.24774169921875, -1.139892578125, -1.03204345703125, -0.9241943359375, -0.81634521484375, -0.70849609375, -0.60064697265625, -0.4927978515625, -0.38494873046875, -0.277099609375, -0.16925048828125, -0.0614013671875, 0.04644775390625, 0.154296875, 0.26214599609375, 0.3699951171875, 0.47784423828125, 0.585693359375, 0.69354248046875, 0.8013916015625, 0.90924072265625, 1.01708984375, 1.12493896484375, 1.2327880859375, 1.34063720703125, 1.448486328125, 1.55633544921875, 1.6641845703125, 1.77203369140625, 1.8798828125, 1.98773193359375, 2.0955810546875, 2.20343017578125, 2.311279296875, 2.41912841796875, 2.5269775390625, 2.63482666015625, 2.74267578125, 2.85052490234375, 2.9583740234375, 3.06622314453125, 3.174072265625, 3.28192138671875, 3.3897705078125, 3.49761962890625, 3.60546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 10.0, 19.0, 19.0, 33.0, 55.0, 115.0, 132.0, 160.0, 154.0, 113.0, 59.0, 29.0, 18.0, 17.0, 12.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002132415771484375, -0.002070903778076172, -0.0020093917846679688, -0.0019478797912597656, -0.0018863677978515625, -0.0018248558044433594, -0.0017633438110351562, -0.0017018318176269531, -0.00164031982421875, -0.0015788078308105469, -0.0015172958374023438, -0.0014557838439941406, -0.0013942718505859375, -0.0013327598571777344, -0.0012712478637695312, -0.0012097358703613281, -0.001148223876953125, -0.0010867118835449219, -0.0010251998901367188, -0.0009636878967285156, -0.0009021759033203125, -0.0008406639099121094, -0.0007791519165039062, -0.0007176399230957031, -0.0006561279296875, -0.0005946159362792969, -0.0005331039428710938, -0.0004715919494628906, -0.0004100799560546875, -0.0003485679626464844, -0.00028705596923828125, -0.00022554397583007812, -0.000164031982421875, -0.00010251998901367188, -4.100799560546875e-05, 2.0503997802734375e-05, 8.20159912109375e-05, 0.00014352798461914062, 0.00020503997802734375, 0.0002665519714355469, 0.00032806396484375, 0.0003895759582519531, 0.00045108795166015625, 0.0005125999450683594, 0.0005741119384765625, 0.0006356239318847656, 0.0006971359252929688, 0.0007586479187011719, 0.000820159912109375, 0.0008816719055175781, 0.0009431838989257812, 0.0010046958923339844, 0.0010662078857421875, 0.0011277198791503906, 0.0011892318725585938, 0.0012507438659667969, 0.001312255859375, 0.0013737678527832031, 0.0014352798461914062, 0.0014967918395996094, 0.0015583038330078125, 0.0016198158264160156, 0.0016813278198242188, 0.0017428398132324219, 0.001804351806640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 8.0, 9.0, 11.0, 10.0, 28.0, 49.0, 101.0, 242.0, 579.0, 2079.0, 11848.0, 477005.0, 540771.0, 12604.0, 2155.0, 590.0, 226.0, 91.0, 40.0, 28.0, 19.0, 11.0, 8.0, 6.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8984375, -9.607421875, -9.31640625, -9.025390625, -8.734375, -8.443359375, -8.15234375, -7.861328125, -7.5703125, -7.279296875, -6.98828125, -6.697265625, -6.40625, -6.115234375, -5.82421875, -5.533203125, -5.2421875, -4.951171875, -4.66015625, -4.369140625, -4.078125, -3.787109375, -3.49609375, -3.205078125, -2.9140625, -2.623046875, -2.33203125, -2.041015625, -1.75, -1.458984375, -1.16796875, -0.876953125, -0.5859375, -0.294921875, -0.00390625, 0.287109375, 0.578125, 0.869140625, 1.16015625, 1.451171875, 1.7421875, 2.033203125, 2.32421875, 2.615234375, 2.90625, 3.197265625, 3.48828125, 3.779296875, 4.0703125, 4.361328125, 4.65234375, 4.943359375, 5.234375, 5.525390625, 5.81640625, 6.107421875, 6.3984375, 6.689453125, 6.98046875, 7.271484375, 7.5625, 7.853515625, 8.14453125, 8.435546875, 8.7265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 5.0, 11.0, 5.0, 15.0, 24.0, 27.0, 45.0, 58.0, 87.0, 107.0, 130.0, 126.0, 82.0, 77.0, 54.0, 34.0, 22.0, 19.0, 13.0, 12.0, 12.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.177734375, -1.1428985595703125, -1.108062744140625, -1.0732269287109375, -1.03839111328125, -1.0035552978515625, -0.968719482421875, -0.9338836669921875, -0.8990478515625, -0.8642120361328125, -0.829376220703125, -0.7945404052734375, -0.75970458984375, -0.7248687744140625, -0.690032958984375, -0.6551971435546875, -0.620361328125, -0.5855255126953125, -0.550689697265625, -0.5158538818359375, -0.48101806640625, -0.4461822509765625, -0.411346435546875, -0.3765106201171875, -0.3416748046875, -0.3068389892578125, -0.272003173828125, -0.2371673583984375, -0.20233154296875, -0.1674957275390625, -0.132659912109375, -0.0978240966796875, -0.06298828125, -0.0281524658203125, 0.006683349609375, 0.0415191650390625, 0.07635498046875, 0.1111907958984375, 0.146026611328125, 0.1808624267578125, 0.2156982421875, 0.2505340576171875, 0.285369873046875, 0.3202056884765625, 0.35504150390625, 0.3898773193359375, 0.424713134765625, 0.4595489501953125, 0.494384765625, 0.5292205810546875, 0.564056396484375, 0.5988922119140625, 0.63372802734375, 0.6685638427734375, 0.703399658203125, 0.7382354736328125, 0.7730712890625, 0.8079071044921875, 0.842742919921875, 0.8775787353515625, 0.91241455078125, 0.9472503662109375, 0.982086181640625, 1.0169219970703125, 1.0517578125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 10.0, 14.0, 23.0, 33.0, 33.0, 43.0, 60.0, 62.0, 79.0, 80.0, 94.0, 100.0, 72.0, 78.0, 53.0, 52.0, 31.0, 20.0, 12.0, 10.0, 11.0, 11.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.561897277832031, -14.15044116973877, -13.738984107971191, -13.32752799987793, -12.916071891784668, -12.504615783691406, -12.093158721923828, -11.681702613830566, -11.270246505737305, -10.858790397644043, -10.447333335876465, -10.035877227783203, -9.624421119689941, -9.21296501159668, -8.801507949829102, -8.39005184173584, -7.978594779968262, -7.567138195037842, -7.15568208694458, -6.74422550201416, -6.332769393920898, -5.9213128089904785, -5.509856224060059, -5.098400115966797, -4.686943531036377, -4.275486946105957, -3.8640308380126953, -3.4525742530822754, -3.0411179065704346, -2.6296615600585938, -2.218204975128174, -1.806748628616333, -1.3952922821044922, -0.9838358759880066, -0.572379469871521, -0.16092300415039062, 0.2505333423614502, 0.661989688873291, 1.073446273803711, 1.4849026203155518, 1.8963589668273926, 2.3078153133392334, 2.719271659851074, 3.130728244781494, 3.542184591293335, 3.953640937805176, 4.365097522735596, 4.776554107666016, 5.188010215759277, 5.599466800689697, 6.010922908782959, 6.422379493713379, 6.833835601806641, 7.2452921867370605, 7.6567487716674805, 8.068204879760742, 8.47966194152832, 8.891118049621582, 9.30257511138916, 9.714031219482422, 10.125487327575684, 10.536943435668945, 10.948400497436523, 11.359856605529785, 11.771312713623047]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 9.0, 7.0, 8.0, 8.0, 21.0, 13.0, 18.0, 15.0, 17.0, 24.0, 29.0, 38.0, 37.0, 40.0, 42.0, 39.0, 44.0, 44.0, 39.0, 44.0, 31.0, 44.0, 47.0, 27.0, 41.0, 24.0, 28.0, 26.0, 25.0, 30.0, 27.0, 23.0, 14.0, 14.0, 15.0, 9.0, 9.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-8.162459373474121, -7.934866905212402, -7.707274436950684, -7.479681968688965, -7.252089500427246, -7.024497032165527, -6.796904563903809, -6.56931209564209, -6.341719627380371, -6.114127159118652, -5.886534690856934, -5.658942222595215, -5.431349754333496, -5.203757286071777, -4.976164817810059, -4.74857234954834, -4.520979404449463, -4.293386936187744, -4.065794467926025, -3.8382019996643066, -3.610609531402588, -3.383017063140869, -3.1554243564605713, -2.9278318881988525, -2.700239419937134, -2.472646951675415, -2.2450544834136963, -2.0174617767333984, -1.7898694276809692, -1.5622769594192505, -1.3346843719482422, -1.1070919036865234, -0.8794999122619629, -0.6519074440002441, -0.4243149161338806, -0.1967223882675171, 0.03087007999420166, 0.2584625482559204, 0.4860551357269287, 0.7136476039886475, 0.9412400722503662, 1.168832540512085, 1.3964250087738037, 1.624017596244812, 1.8516100645065308, 2.079202651977539, 2.306795120239258, 2.5343875885009766, 2.7619800567626953, 2.989572525024414, 3.217164993286133, 3.4447574615478516, 3.6723499298095703, 3.899942398071289, 4.127534866333008, 4.355127334594727, 4.582719802856445, 4.810312271118164, 5.037904739379883, 5.265497207641602, 5.49308967590332, 5.720682144165039, 5.948274612426758, 6.175867080688477, 6.4034600257873535]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 17.0, 27.0, 32.0, 38.0, 57.0, 96.0, 140.0, 206.0, 341.0, 539.0, 747.0, 1249.0, 2005.0, 3461.0, 5717.0, 10641.0, 19195.0, 37143.0, 72578.0, 144733.0, 239762.0, 230689.0, 135121.0, 67913.0, 34534.0, 17872.0, 9654.0, 5435.0, 3201.0, 1984.0, 1189.0, 746.0, 512.0, 315.0, 206.0, 152.0, 107.0, 51.0, 41.0, 26.0, 20.0, 13.0, 8.0, 3.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.6953125, -3.586456298828125, -3.47760009765625, -3.368743896484375, -3.2598876953125, -3.151031494140625, -3.04217529296875, -2.933319091796875, -2.824462890625, -2.715606689453125, -2.60675048828125, -2.497894287109375, -2.3890380859375, -2.280181884765625, -2.17132568359375, -2.062469482421875, -1.95361328125, -1.844757080078125, -1.73590087890625, -1.627044677734375, -1.5181884765625, -1.409332275390625, -1.30047607421875, -1.191619873046875, -1.082763671875, -0.973907470703125, -0.86505126953125, -0.756195068359375, -0.6473388671875, -0.538482666015625, -0.42962646484375, -0.320770263671875, -0.2119140625, -0.103057861328125, 0.00579833984375, 0.114654541015625, 0.2235107421875, 0.332366943359375, 0.44122314453125, 0.550079345703125, 0.658935546875, 0.767791748046875, 0.87664794921875, 0.985504150390625, 1.0943603515625, 1.203216552734375, 1.31207275390625, 1.420928955078125, 1.52978515625, 1.638641357421875, 1.74749755859375, 1.856353759765625, 1.9652099609375, 2.074066162109375, 2.18292236328125, 2.291778564453125, 2.400634765625, 2.509490966796875, 2.61834716796875, 2.727203369140625, 2.8360595703125, 2.944915771484375, 3.05377197265625, 3.162628173828125, 3.271484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 5.0, 9.0, 10.0, 11.0, 24.0, 17.0, 11.0, 24.0, 28.0, 15.0, 30.0, 38.0, 35.0, 37.0, 31.0, 34.0, 47.0, 44.0, 40.0, 41.0, 39.0, 51.0, 38.0, 30.0, 34.0, 36.0, 36.0, 31.0, 30.0, 26.0, 13.0, 16.0, 18.0, 11.0, 10.0, 7.0, 6.0, 3.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.125, -36.01220703125, -34.8994140625, -33.78662109375, -32.673828125, -31.56103515625, -30.4482421875, -29.33544921875, -28.22265625, -27.10986328125, -25.9970703125, -24.88427734375, -23.771484375, -22.65869140625, -21.5458984375, -20.43310546875, -19.3203125, -18.20751953125, -17.0947265625, -15.98193359375, -14.869140625, -13.75634765625, -12.6435546875, -11.53076171875, -10.41796875, -9.30517578125, -8.1923828125, -7.07958984375, -5.966796875, -4.85400390625, -3.7412109375, -2.62841796875, -1.515625, -0.40283203125, 0.7099609375, 1.82275390625, 2.935546875, 4.04833984375, 5.1611328125, 6.27392578125, 7.38671875, 8.49951171875, 9.6123046875, 10.72509765625, 11.837890625, 12.95068359375, 14.0634765625, 15.17626953125, 16.2890625, 17.40185546875, 18.5146484375, 19.62744140625, 20.740234375, 21.85302734375, 22.9658203125, 24.07861328125, 25.19140625, 26.30419921875, 27.4169921875, 28.52978515625, 29.642578125, 30.75537109375, 31.8681640625, 32.98095703125, 34.09375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 8.0, 13.0, 16.0, 20.0, 18.0, 27.0, 34.0, 44.0, 62.0, 94.0, 116.0, 156.0, 249.0, 490.0, 1400.0, 13838.0, 576730.0, 442505.0, 10173.0, 1153.0, 477.0, 274.0, 162.0, 111.0, 78.0, 51.0, 52.0, 37.0, 39.0, 34.0, 20.0, 24.0, 10.0, 11.0, 8.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.237060546875, -16.66162109375, -16.086181640625, -15.5107421875, -14.935302734375, -14.35986328125, -13.784423828125, -13.208984375, -12.633544921875, -12.05810546875, -11.482666015625, -10.9072265625, -10.331787109375, -9.75634765625, -9.180908203125, -8.60546875, -8.030029296875, -7.45458984375, -6.879150390625, -6.3037109375, -5.728271484375, -5.15283203125, -4.577392578125, -4.001953125, -3.426513671875, -2.85107421875, -2.275634765625, -1.7001953125, -1.124755859375, -0.54931640625, 0.026123046875, 0.6015625, 1.177001953125, 1.75244140625, 2.327880859375, 2.9033203125, 3.478759765625, 4.05419921875, 4.629638671875, 5.205078125, 5.780517578125, 6.35595703125, 6.931396484375, 7.5068359375, 8.082275390625, 8.65771484375, 9.233154296875, 9.80859375, 10.384033203125, 10.95947265625, 11.534912109375, 12.1103515625, 12.685791015625, 13.26123046875, 13.836669921875, 14.412109375, 14.987548828125, 15.56298828125, 16.138427734375, 16.7138671875, 17.289306640625, 17.86474609375, 18.440185546875, 19.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 4.0, 15.0, 11.0, 17.0, 19.0, 33.0, 30.0, 29.0, 34.0, 40.0, 46.0, 63.0, 51.0, 54.0, 43.0, 66.0, 54.0, 52.0, 48.0, 52.0, 37.0, 27.0, 18.0, 31.0, 17.0, 15.0, 15.0, 19.0, 12.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.71875, -36.48583984375, -35.2529296875, -34.02001953125, -32.787109375, -31.55419921875, -30.3212890625, -29.08837890625, -27.85546875, -26.62255859375, -25.3896484375, -24.15673828125, -22.923828125, -21.69091796875, -20.4580078125, -19.22509765625, -17.9921875, -16.75927734375, -15.5263671875, -14.29345703125, -13.060546875, -11.82763671875, -10.5947265625, -9.36181640625, -8.12890625, -6.89599609375, -5.6630859375, -4.43017578125, -3.197265625, -1.96435546875, -0.7314453125, 0.50146484375, 1.734375, 2.96728515625, 4.2001953125, 5.43310546875, 6.666015625, 7.89892578125, 9.1318359375, 10.36474609375, 11.59765625, 12.83056640625, 14.0634765625, 15.29638671875, 16.529296875, 17.76220703125, 18.9951171875, 20.22802734375, 21.4609375, 22.69384765625, 23.9267578125, 25.15966796875, 26.392578125, 27.62548828125, 28.8583984375, 30.09130859375, 31.32421875, 32.55712890625, 33.7900390625, 35.02294921875, 36.255859375, 37.48876953125, 38.7216796875, 39.95458984375, 41.1875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 2.0, 10.0, 11.0, 17.0, 35.0, 25.0, 49.0, 69.0, 92.0, 171.0, 307.0, 527.0, 1070.0, 2483.0, 6270.0, 18610.0, 94102.0, 704972.0, 177806.0, 27536.0, 8239.0, 3047.0, 1352.0, 689.0, 379.0, 236.0, 137.0, 73.0, 57.0, 48.0, 28.0, 21.0, 13.0, 12.0, 9.0, 15.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5478515625, -1.495635986328125, -1.44342041015625, -1.391204833984375, -1.3389892578125, -1.286773681640625, -1.23455810546875, -1.182342529296875, -1.130126953125, -1.077911376953125, -1.02569580078125, -0.973480224609375, -0.9212646484375, -0.869049072265625, -0.81683349609375, -0.764617919921875, -0.71240234375, -0.660186767578125, -0.60797119140625, -0.555755615234375, -0.5035400390625, -0.451324462890625, -0.39910888671875, -0.346893310546875, -0.294677734375, -0.242462158203125, -0.19024658203125, -0.138031005859375, -0.0858154296875, -0.033599853515625, 0.01861572265625, 0.070831298828125, 0.123046875, 0.175262451171875, 0.22747802734375, 0.279693603515625, 0.3319091796875, 0.384124755859375, 0.43634033203125, 0.488555908203125, 0.540771484375, 0.592987060546875, 0.64520263671875, 0.697418212890625, 0.7496337890625, 0.801849365234375, 0.85406494140625, 0.906280517578125, 0.95849609375, 1.010711669921875, 1.06292724609375, 1.115142822265625, 1.1673583984375, 1.219573974609375, 1.27178955078125, 1.324005126953125, 1.376220703125, 1.428436279296875, 1.48065185546875, 1.532867431640625, 1.5850830078125, 1.637298583984375, 1.68951416015625, 1.741729736328125, 1.7939453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 5.0, 5.0, 18.0, 25.0, 20.0, 36.0, 57.0, 73.0, 143.0, 173.0, 133.0, 93.0, 65.0, 43.0, 28.0, 19.0, 11.0, 6.0, 9.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003361701965332031, -0.00032558292150497437, -0.0003149956464767456, -0.00030440837144851685, -0.0002938210964202881, -0.0002832338213920593, -0.00027264654636383057, -0.0002620592713356018, -0.00025147199630737305, -0.0002408847212791443, -0.00023029744625091553, -0.00021971017122268677, -0.000209122896194458, -0.00019853562116622925, -0.0001879483461380005, -0.00017736107110977173, -0.00016677379608154297, -0.0001561865210533142, -0.00014559924602508545, -0.0001350119709968567, -0.00012442469596862793, -0.00011383742094039917, -0.00010325014591217041, -9.266287088394165e-05, -8.207559585571289e-05, -7.148832082748413e-05, -6.090104579925537e-05, -5.031377077102661e-05, -3.972649574279785e-05, -2.9139220714569092e-05, -1.8551945686340332e-05, -7.964670658111572e-06, 2.6226043701171875e-06, 1.3209879398345947e-05, 2.3797154426574707e-05, 3.438442945480347e-05, 4.4971704483032227e-05, 5.5558979511260986e-05, 6.614625453948975e-05, 7.67335295677185e-05, 8.732080459594727e-05, 9.790807962417603e-05, 0.00010849535465240479, 0.00011908262968063354, 0.0001296699047088623, 0.00014025717973709106, 0.00015084445476531982, 0.00016143172979354858, 0.00017201900482177734, 0.0001826062798500061, 0.00019319355487823486, 0.00020378082990646362, 0.00021436810493469238, 0.00022495537996292114, 0.0002355426549911499, 0.00024612993001937866, 0.0002567172050476074, 0.0002673044800758362, 0.00027789175510406494, 0.0002884790301322937, 0.00029906630516052246, 0.0003096535801887512, 0.00032024085521698, 0.00033082813024520874, 0.0003414154052734375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 8.0, 9.0, 10.0, 13.0, 19.0, 26.0, 43.0, 47.0, 57.0, 101.0, 148.0, 244.0, 451.0, 771.0, 1349.0, 2649.0, 5686.0, 14124.0, 42669.0, 237272.0, 616950.0, 86488.0, 22718.0, 8582.0, 3778.0, 1916.0, 970.0, 529.0, 345.0, 204.0, 115.0, 86.0, 44.0, 32.0, 18.0, 13.0, 14.0, 14.0, 6.0, 8.0, 7.0, 2.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-1.5556640625, -1.510223388671875, -1.46478271484375, -1.419342041015625, -1.3739013671875, -1.328460693359375, -1.28302001953125, -1.237579345703125, -1.192138671875, -1.146697998046875, -1.10125732421875, -1.055816650390625, -1.0103759765625, -0.964935302734375, -0.91949462890625, -0.874053955078125, -0.82861328125, -0.783172607421875, -0.73773193359375, -0.692291259765625, -0.6468505859375, -0.601409912109375, -0.55596923828125, -0.510528564453125, -0.465087890625, -0.419647216796875, -0.37420654296875, -0.328765869140625, -0.2833251953125, -0.237884521484375, -0.19244384765625, -0.147003173828125, -0.1015625, -0.056121826171875, -0.01068115234375, 0.034759521484375, 0.0802001953125, 0.125640869140625, 0.17108154296875, 0.216522216796875, 0.261962890625, 0.307403564453125, 0.35284423828125, 0.398284912109375, 0.4437255859375, 0.489166259765625, 0.53460693359375, 0.580047607421875, 0.62548828125, 0.670928955078125, 0.71636962890625, 0.761810302734375, 0.8072509765625, 0.852691650390625, 0.89813232421875, 0.943572998046875, 0.989013671875, 1.034454345703125, 1.07989501953125, 1.125335693359375, 1.1707763671875, 1.216217041015625, 1.26165771484375, 1.307098388671875, 1.3525390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 3.0, 8.0, 8.0, 8.0, 14.0, 14.0, 29.0, 45.0, 40.0, 52.0, 66.0, 74.0, 138.0, 120.0, 87.0, 44.0, 45.0, 28.0, 27.0, 33.0, 23.0, 13.0, 11.0, 10.0, 8.0, 7.0, 2.0, 5.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6075897216796875, -0.589691162109375, -0.5717926025390625, -0.55389404296875, -0.5359954833984375, -0.518096923828125, -0.5001983642578125, -0.4822998046875, -0.4644012451171875, -0.446502685546875, -0.4286041259765625, -0.41070556640625, -0.3928070068359375, -0.374908447265625, -0.3570098876953125, -0.339111328125, -0.3212127685546875, -0.303314208984375, -0.2854156494140625, -0.26751708984375, -0.2496185302734375, -0.231719970703125, -0.2138214111328125, -0.1959228515625, -0.1780242919921875, -0.160125732421875, -0.1422271728515625, -0.12432861328125, -0.1064300537109375, -0.088531494140625, -0.0706329345703125, -0.052734375, -0.0348358154296875, -0.016937255859375, 0.0009613037109375, 0.01885986328125, 0.0367584228515625, 0.054656982421875, 0.0725555419921875, 0.0904541015625, 0.1083526611328125, 0.126251220703125, 0.1441497802734375, 0.16204833984375, 0.1799468994140625, 0.197845458984375, 0.2157440185546875, 0.233642578125, 0.2515411376953125, 0.269439697265625, 0.2873382568359375, 0.30523681640625, 0.3231353759765625, 0.341033935546875, 0.3589324951171875, 0.3768310546875, 0.3947296142578125, 0.412628173828125, 0.4305267333984375, 0.44842529296875, 0.4663238525390625, 0.484222412109375, 0.5021209716796875, 0.52001953125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 20.0, 88.0, 236.0, 338.0, 231.0, 80.0, 16.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21491813659668, -11.640115737915039, -9.065313339233398, -6.490509986877441, -3.915707588195801, -1.3409051895141602, 1.2338981628417969, 3.8087005615234375, 6.383502960205078, 8.958305358886719, 11.53310775756836, 14.107911109924316, 16.68271255493164, 19.25751495361328, 21.832319259643555, 24.407121658325195, 26.981924057006836, 29.556726455688477, 32.13153076171875, 34.70633316040039, 37.28113555908203, 39.85593795776367, 42.43074035644531, 45.00554275512695, 47.580345153808594, 50.155147552490234, 52.729949951171875, 55.304752349853516, 57.879554748535156, 60.4543571472168, 63.02915954589844, 65.60396575927734, 68.17876434326172, 70.75357055664062, 73.328369140625, 75.9031753540039, 78.47797393798828, 81.05278015136719, 83.62757873535156, 86.20238494873047, 88.77718353271484, 91.35198974609375, 93.92678833007812, 96.50159454345703, 99.0763931274414, 101.65119934082031, 104.22599792480469, 106.8008041381836, 109.3756103515625, 111.9504165649414, 114.52521514892578, 117.10002136230469, 119.67481994628906, 122.24962615966797, 124.82442474365234, 127.39923095703125, 129.97402954101562, 132.548828125, 135.12364196777344, 137.6984405517578, 140.2732391357422, 142.84803771972656, 145.4228515625, 147.99765014648438, 150.57244873046875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 7.0, 4.0, 11.0, 13.0, 8.0, 10.0, 17.0, 21.0, 17.0, 15.0, 20.0, 14.0, 33.0, 31.0, 28.0, 28.0, 32.0, 34.0, 38.0, 33.0, 40.0, 38.0, 34.0, 38.0, 37.0, 37.0, 41.0, 26.0, 31.0, 31.0, 34.0, 28.0, 23.0, 23.0, 22.0, 17.0, 14.0, 15.0, 12.0, 8.0, 9.0, 7.0, 12.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-54.5134162902832, -52.98008728027344, -51.44675827026367, -49.913429260253906, -48.380104064941406, -46.84677505493164, -45.313446044921875, -43.78011703491211, -42.246788024902344, -40.71345901489258, -39.18013000488281, -37.64680099487305, -36.11347198486328, -34.58014678955078, -33.046817779541016, -31.51348876953125, -29.980159759521484, -28.44683074951172, -26.913501739501953, -25.38017463684082, -23.846845626831055, -22.31351661682129, -20.780189514160156, -19.24686050415039, -17.713531494140625, -16.18020248413086, -14.64687442779541, -13.113546371459961, -11.580217361450195, -10.04688835144043, -8.51356029510498, -6.980232238769531, -5.446903228759766, -3.913574695587158, -2.380246162414551, -0.8469176292419434, 0.6864109039306641, 2.2197394371032715, 3.753067970275879, 5.286396026611328, 6.819725036621094, 8.35305404663086, 9.886382102966309, 11.419710159301758, 12.953039169311523, 14.486368179321289, 16.019695281982422, 17.553024291992188, 19.086353302001953, 20.61968231201172, 22.153011322021484, 23.686338424682617, 25.219667434692383, 26.75299644470215, 28.28632354736328, 29.819652557373047, 31.352981567382812, 32.88631057739258, 34.419639587402344, 35.95296859741211, 37.486297607421875, 39.019622802734375, 40.55295181274414, 42.086280822753906, 43.61960983276367]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 4.0, 11.0, 22.0, 21.0, 21.0, 36.0, 67.0, 101.0, 150.0, 236.0, 422.0, 689.0, 1216.0, 2306.0, 4513.0, 9527.0, 22741.0, 67266.0, 299305.0, 1363011.0, 1838139.0, 440160.0, 93153.0, 28549.0, 11492.0, 5197.0, 2538.0, 1398.0, 778.0, 439.0, 256.0, 169.0, 105.0, 73.0, 39.0, 36.0, 25.0, 17.0, 15.0, 14.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3515625, -10.0189208984375, -9.686279296875, -9.3536376953125, -9.02099609375, -8.6883544921875, -8.355712890625, -8.0230712890625, -7.6904296875, -7.3577880859375, -7.025146484375, -6.6925048828125, -6.35986328125, -6.0272216796875, -5.694580078125, -5.3619384765625, -5.029296875, -4.6966552734375, -4.364013671875, -4.0313720703125, -3.69873046875, -3.3660888671875, -3.033447265625, -2.7008056640625, -2.3681640625, -2.0355224609375, -1.702880859375, -1.3702392578125, -1.03759765625, -0.7049560546875, -0.372314453125, -0.0396728515625, 0.29296875, 0.6256103515625, 0.958251953125, 1.2908935546875, 1.62353515625, 1.9561767578125, 2.288818359375, 2.6214599609375, 2.9541015625, 3.2867431640625, 3.619384765625, 3.9520263671875, 4.28466796875, 4.6173095703125, 4.949951171875, 5.2825927734375, 5.615234375, 5.9478759765625, 6.280517578125, 6.6131591796875, 6.94580078125, 7.2784423828125, 7.611083984375, 7.9437255859375, 8.2763671875, 8.6090087890625, 8.941650390625, 9.2742919921875, 9.60693359375, 9.9395751953125, 10.272216796875, 10.6048583984375, 10.9375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 8.0, 14.0, 18.0, 22.0, 19.0, 19.0, 34.0, 35.0, 28.0, 34.0, 43.0, 39.0, 45.0, 38.0, 42.0, 44.0, 58.0, 33.0, 52.0, 35.0, 47.0, 29.0, 44.0, 27.0, 34.0, 29.0, 14.0, 18.0, 9.0, 8.0, 15.0, 5.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-10.1015625, -9.82958984375, -9.5576171875, -9.28564453125, -9.013671875, -8.74169921875, -8.4697265625, -8.19775390625, -7.92578125, -7.65380859375, -7.3818359375, -7.10986328125, -6.837890625, -6.56591796875, -6.2939453125, -6.02197265625, -5.75, -5.47802734375, -5.2060546875, -4.93408203125, -4.662109375, -4.39013671875, -4.1181640625, -3.84619140625, -3.57421875, -3.30224609375, -3.0302734375, -2.75830078125, -2.486328125, -2.21435546875, -1.9423828125, -1.67041015625, -1.3984375, -1.12646484375, -0.8544921875, -0.58251953125, -0.310546875, -0.03857421875, 0.2333984375, 0.50537109375, 0.77734375, 1.04931640625, 1.3212890625, 1.59326171875, 1.865234375, 2.13720703125, 2.4091796875, 2.68115234375, 2.953125, 3.22509765625, 3.4970703125, 3.76904296875, 4.041015625, 4.31298828125, 4.5849609375, 4.85693359375, 5.12890625, 5.40087890625, 5.6728515625, 5.94482421875, 6.216796875, 6.48876953125, 6.7607421875, 7.03271484375, 7.3046875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 15.0, 16.0, 46.0, 216.0, 3854418.0, 339300.0, 169.0, 46.0, 18.0, 17.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-410.5, -400.23046875, -389.9609375, -379.69140625, -369.421875, -359.15234375, -348.8828125, -338.61328125, -328.34375, -318.07421875, -307.8046875, -297.53515625, -287.265625, -276.99609375, -266.7265625, -256.45703125, -246.1875, -235.91796875, -225.6484375, -215.37890625, -205.109375, -194.83984375, -184.5703125, -174.30078125, -164.03125, -153.76171875, -143.4921875, -133.22265625, -122.953125, -112.68359375, -102.4140625, -92.14453125, -81.875, -71.60546875, -61.3359375, -51.06640625, -40.796875, -30.52734375, -20.2578125, -9.98828125, 0.28125, 10.55078125, 20.8203125, 31.08984375, 41.359375, 51.62890625, 61.8984375, 72.16796875, 82.4375, 92.70703125, 102.9765625, 113.24609375, 123.515625, 133.78515625, 144.0546875, 154.32421875, 164.59375, 174.86328125, 185.1328125, 195.40234375, 205.671875, 215.94140625, 226.2109375, 236.48046875, 246.75]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 22.0, 25.0, 26.0, 40.0, 52.0, 88.0, 136.0, 208.0, 346.0, 572.0, 868.0, 639.0, 376.0, 226.0, 144.0, 104.0, 59.0, 41.0, 16.0, 21.0, 16.0, 11.0, 3.0, 4.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.62213134765625, -4.4708251953125, -4.31951904296875, -4.168212890625, -4.01690673828125, -3.8656005859375, -3.71429443359375, -3.56298828125, -3.41168212890625, -3.2603759765625, -3.10906982421875, -2.957763671875, -2.80645751953125, -2.6551513671875, -2.50384521484375, -2.3525390625, -2.20123291015625, -2.0499267578125, -1.89862060546875, -1.747314453125, -1.59600830078125, -1.4447021484375, -1.29339599609375, -1.14208984375, -0.99078369140625, -0.8394775390625, -0.68817138671875, -0.536865234375, -0.38555908203125, -0.2342529296875, -0.08294677734375, 0.068359375, 0.21966552734375, 0.3709716796875, 0.52227783203125, 0.673583984375, 0.82489013671875, 0.9761962890625, 1.12750244140625, 1.27880859375, 1.43011474609375, 1.5814208984375, 1.73272705078125, 1.884033203125, 2.03533935546875, 2.1866455078125, 2.33795166015625, 2.4892578125, 2.64056396484375, 2.7918701171875, 2.94317626953125, 3.094482421875, 3.24578857421875, 3.3970947265625, 3.54840087890625, 3.69970703125, 3.85101318359375, 4.0023193359375, 4.15362548828125, 4.304931640625, 4.45623779296875, 4.6075439453125, 4.75885009765625, 4.91015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 9.0, 26.0, 33.0, 40.0, 50.0, 78.0, 80.0, 104.0, 114.0, 97.0, 83.0, 61.0, 78.0, 40.0, 31.0, 18.0, 18.0, 13.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.420784950256348, -14.867645263671875, -14.314505577087402, -13.76136589050293, -13.208227157592773, -12.655086517333984, -12.101947784423828, -11.548808097839355, -10.995668411254883, -10.44252872467041, -9.889389038085938, -9.336249351501465, -8.783109664916992, -8.229970932006836, -7.676831245422363, -7.123691558837891, -6.570551872253418, -6.017412185668945, -5.464272499084473, -4.911133289337158, -4.3579936027526855, -3.804853916168213, -3.2517144680023193, -2.698575019836426, -2.145435333251953, -1.59229576587677, -1.039156198501587, -0.4860166311264038, 0.0671229362487793, 0.620262622833252, 1.1734020709991455, 1.726541519165039, 2.279682159423828, 2.832821846008301, 3.3859612941741943, 3.939100742340088, 4.4922404289245605, 5.045380115509033, 5.598519325256348, 6.15165901184082, 6.704798698425293, 7.257938385009766, 7.811078071594238, 8.364217758178711, 8.917356491088867, 9.470497131347656, 10.023635864257812, 10.576775550842285, 11.129915237426758, 11.68305492401123, 12.236194610595703, 12.789334297180176, 13.342473983764648, 13.895612716674805, 14.448752403259277, 15.00189208984375, 15.555031776428223, 16.108171463012695, 16.66131019592285, 17.21445083618164, 17.767589569091797, 18.320730209350586, 18.873868942260742, 19.42700958251953, 19.980148315429688]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 9.0, 7.0, 12.0, 9.0, 16.0, 23.0, 21.0, 33.0, 24.0, 26.0, 29.0, 28.0, 35.0, 40.0, 55.0, 42.0, 46.0, 51.0, 37.0, 47.0, 46.0, 40.0, 36.0, 35.0, 27.0, 23.0, 35.0, 19.0, 25.0, 21.0, 15.0, 18.0, 14.0, 14.0, 13.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.179637908935547, -8.89326286315918, -8.606888771057129, -8.320513725280762, -8.034138679504395, -7.7477641105651855, -7.461389541625977, -7.175014495849609, -6.8886399269104, -6.602265357971191, -6.315890312194824, -6.029515743255615, -5.743141174316406, -5.456766128540039, -5.17039155960083, -4.884016990661621, -4.597641944885254, -4.311267375946045, -4.024892330169678, -3.7385177612304688, -3.4521429538726807, -3.1657681465148926, -2.8793935775756836, -2.5930187702178955, -2.3066439628601074, -2.0202691555023193, -1.7338944673538208, -1.4475197792053223, -1.1611449718475342, -0.8747701644897461, -0.5883954763412476, -0.302020788192749, -0.015646934509277344, 0.27072781324386597, 0.5571025609970093, 0.8434773087501526, 1.129852056503296, 1.416226863861084, 1.7026015520095825, 1.988976240158081, 2.275351047515869, 2.5617258548736572, 2.8481006622314453, 3.1344752311706543, 3.4208500385284424, 3.7072248458862305, 3.9935994148254395, 4.279973983764648, 4.566349029541016, 4.852723598480225, 5.139098644256592, 5.425473213195801, 5.711848258972168, 5.998222827911377, 6.284597396850586, 6.570972442626953, 6.857347011566162, 7.143721580505371, 7.430096626281738, 7.716471195220947, 8.002845764160156, 8.289220809936523, 8.57559585571289, 8.861969947814941, 9.148344993591309]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 5.0, 10.0, 13.0, 25.0, 50.0, 65.0, 126.0, 197.0, 395.0, 635.0, 1182.0, 2291.0, 4624.0, 10327.0, 24724.0, 66349.0, 178856.0, 359565.0, 244010.0, 94274.0, 34591.0, 13863.0, 6096.0, 2908.0, 1533.0, 806.0, 438.0, 248.0, 141.0, 83.0, 51.0, 21.0, 20.0, 15.0, 10.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.21795654296875, -4.0804443359375, -3.94293212890625, -3.805419921875, -3.66790771484375, -3.5303955078125, -3.39288330078125, -3.25537109375, -3.11785888671875, -2.9803466796875, -2.84283447265625, -2.705322265625, -2.56781005859375, -2.4302978515625, -2.29278564453125, -2.1552734375, -2.01776123046875, -1.8802490234375, -1.74273681640625, -1.605224609375, -1.46771240234375, -1.3302001953125, -1.19268798828125, -1.05517578125, -0.91766357421875, -0.7801513671875, -0.64263916015625, -0.505126953125, -0.36761474609375, -0.2301025390625, -0.09259033203125, 0.044921875, 0.18243408203125, 0.3199462890625, 0.45745849609375, 0.594970703125, 0.73248291015625, 0.8699951171875, 1.00750732421875, 1.14501953125, 1.28253173828125, 1.4200439453125, 1.55755615234375, 1.695068359375, 1.83258056640625, 1.9700927734375, 2.10760498046875, 2.2451171875, 2.38262939453125, 2.5201416015625, 2.65765380859375, 2.795166015625, 2.93267822265625, 3.0701904296875, 3.20770263671875, 3.34521484375, 3.48272705078125, 3.6202392578125, 3.75775146484375, 3.895263671875, 4.03277587890625, 4.1702880859375, 4.30780029296875, 4.4453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 4.0, 4.0, 7.0, 10.0, 8.0, 14.0, 16.0, 18.0, 28.0, 17.0, 23.0, 41.0, 31.0, 43.0, 48.0, 47.0, 47.0, 50.0, 41.0, 57.0, 47.0, 55.0, 42.0, 37.0, 29.0, 35.0, 31.0, 32.0, 23.0, 25.0, 16.0, 14.0, 20.0, 9.0, 9.0, 7.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-7.6953125, -7.49102783203125, -7.2867431640625, -7.08245849609375, -6.878173828125, -6.67388916015625, -6.4696044921875, -6.26531982421875, -6.06103515625, -5.85675048828125, -5.6524658203125, -5.44818115234375, -5.243896484375, -5.03961181640625, -4.8353271484375, -4.63104248046875, -4.4267578125, -4.22247314453125, -4.0181884765625, -3.81390380859375, -3.609619140625, -3.40533447265625, -3.2010498046875, -2.99676513671875, -2.79248046875, -2.58819580078125, -2.3839111328125, -2.17962646484375, -1.975341796875, -1.77105712890625, -1.5667724609375, -1.36248779296875, -1.158203125, -0.95391845703125, -0.7496337890625, -0.54534912109375, -0.341064453125, -0.13677978515625, 0.0675048828125, 0.27178955078125, 0.47607421875, 0.68035888671875, 0.8846435546875, 1.08892822265625, 1.293212890625, 1.49749755859375, 1.7017822265625, 1.90606689453125, 2.1103515625, 2.31463623046875, 2.5189208984375, 2.72320556640625, 2.927490234375, 3.13177490234375, 3.3360595703125, 3.54034423828125, 3.74462890625, 3.94891357421875, 4.1531982421875, 4.35748291015625, 4.561767578125, 4.76605224609375, 4.9703369140625, 5.17462158203125, 5.37890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 9.0, 13.0, 14.0, 27.0, 37.0, 67.0, 97.0, 124.0, 209.0, 351.0, 635.0, 1093.0, 2201.0, 4759.0, 11178.0, 28850.0, 84602.0, 265057.0, 411362.0, 155680.0, 49827.0, 18139.0, 7279.0, 3320.0, 1642.0, 767.0, 455.0, 260.0, 159.0, 95.0, 67.0, 38.0, 36.0, 28.0, 17.0, 7.0, 6.0, 8.0, 6.0, 2.0, 3.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2265625, -4.09136962890625, -3.9561767578125, -3.82098388671875, -3.685791015625, -3.55059814453125, -3.4154052734375, -3.28021240234375, -3.14501953125, -3.00982666015625, -2.8746337890625, -2.73944091796875, -2.604248046875, -2.46905517578125, -2.3338623046875, -2.19866943359375, -2.0634765625, -1.92828369140625, -1.7930908203125, -1.65789794921875, -1.522705078125, -1.38751220703125, -1.2523193359375, -1.11712646484375, -0.98193359375, -0.84674072265625, -0.7115478515625, -0.57635498046875, -0.441162109375, -0.30596923828125, -0.1707763671875, -0.03558349609375, 0.099609375, 0.23480224609375, 0.3699951171875, 0.50518798828125, 0.640380859375, 0.77557373046875, 0.9107666015625, 1.04595947265625, 1.18115234375, 1.31634521484375, 1.4515380859375, 1.58673095703125, 1.721923828125, 1.85711669921875, 1.9923095703125, 2.12750244140625, 2.2626953125, 2.39788818359375, 2.5330810546875, 2.66827392578125, 2.803466796875, 2.93865966796875, 3.0738525390625, 3.20904541015625, 3.34423828125, 3.47943115234375, 3.6146240234375, 3.74981689453125, 3.885009765625, 4.02020263671875, 4.1553955078125, 4.29058837890625, 4.42578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 2.0, 8.0, 6.0, 5.0, 10.0, 16.0, 21.0, 14.0, 15.0, 24.0, 16.0, 26.0, 34.0, 23.0, 33.0, 43.0, 35.0, 44.0, 37.0, 43.0, 47.0, 35.0, 48.0, 44.0, 47.0, 39.0, 31.0, 36.0, 42.0, 27.0, 12.0, 17.0, 21.0, 12.0, 12.0, 15.0, 8.0, 13.0, 9.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 6.0], "bins": [-12.5546875, -12.21630859375, -11.8779296875, -11.53955078125, -11.201171875, -10.86279296875, -10.5244140625, -10.18603515625, -9.84765625, -9.50927734375, -9.1708984375, -8.83251953125, -8.494140625, -8.15576171875, -7.8173828125, -7.47900390625, -7.140625, -6.80224609375, -6.4638671875, -6.12548828125, -5.787109375, -5.44873046875, -5.1103515625, -4.77197265625, -4.43359375, -4.09521484375, -3.7568359375, -3.41845703125, -3.080078125, -2.74169921875, -2.4033203125, -2.06494140625, -1.7265625, -1.38818359375, -1.0498046875, -0.71142578125, -0.373046875, -0.03466796875, 0.3037109375, 0.64208984375, 0.98046875, 1.31884765625, 1.6572265625, 1.99560546875, 2.333984375, 2.67236328125, 3.0107421875, 3.34912109375, 3.6875, 4.02587890625, 4.3642578125, 4.70263671875, 5.041015625, 5.37939453125, 5.7177734375, 6.05615234375, 6.39453125, 6.73291015625, 7.0712890625, 7.40966796875, 7.748046875, 8.08642578125, 8.4248046875, 8.76318359375, 9.1015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 5.0, 16.0, 15.0, 28.0, 28.0, 49.0, 50.0, 98.0, 133.0, 286.0, 519.0, 980.0, 1956.0, 4909.0, 13979.0, 49075.0, 243317.0, 552220.0, 134330.0, 30175.0, 9435.0, 3604.0, 1579.0, 737.0, 388.0, 228.0, 123.0, 89.0, 58.0, 43.0, 21.0, 15.0, 11.0, 10.0, 7.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.521484375, -2.4434814453125, -2.365478515625, -2.2874755859375, -2.20947265625, -2.1314697265625, -2.053466796875, -1.9754638671875, -1.8974609375, -1.8194580078125, -1.741455078125, -1.6634521484375, -1.58544921875, -1.5074462890625, -1.429443359375, -1.3514404296875, -1.2734375, -1.1954345703125, -1.117431640625, -1.0394287109375, -0.96142578125, -0.8834228515625, -0.805419921875, -0.7274169921875, -0.6494140625, -0.5714111328125, -0.493408203125, -0.4154052734375, -0.33740234375, -0.2593994140625, -0.181396484375, -0.1033935546875, -0.025390625, 0.0526123046875, 0.130615234375, 0.2086181640625, 0.28662109375, 0.3646240234375, 0.442626953125, 0.5206298828125, 0.5986328125, 0.6766357421875, 0.754638671875, 0.8326416015625, 0.91064453125, 0.9886474609375, 1.066650390625, 1.1446533203125, 1.22265625, 1.3006591796875, 1.378662109375, 1.4566650390625, 1.53466796875, 1.6126708984375, 1.690673828125, 1.7686767578125, 1.8466796875, 1.9246826171875, 2.002685546875, 2.0806884765625, 2.15869140625, 2.2366943359375, 2.314697265625, 2.3927001953125, 2.470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 15.0, 8.0, 17.0, 13.0, 25.0, 31.0, 26.0, 42.0, 54.0, 71.0, 75.0, 99.0, 76.0, 92.0, 68.0, 51.0, 46.0, 38.0, 39.0, 14.0, 14.0, 15.0, 11.0, 14.0, 12.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0011110305786132812, -0.0010795444250106812, -0.001048058271408081, -0.001016572117805481, -0.0009850859642028809, -0.0009535998106002808, -0.0009221136569976807, -0.0008906275033950806, -0.0008591413497924805, -0.0008276551961898804, -0.0007961690425872803, -0.0007646828889846802, -0.0007331967353820801, -0.00070171058177948, -0.0006702244281768799, -0.0006387382745742798, -0.0006072521209716797, -0.0005757659673690796, -0.0005442798137664795, -0.0005127936601638794, -0.0004813075065612793, -0.0004498213529586792, -0.0004183351993560791, -0.000386849045753479, -0.0003553628921508789, -0.0003238767385482788, -0.0002923905849456787, -0.0002609044313430786, -0.00022941827774047852, -0.00019793212413787842, -0.00016644597053527832, -0.00013495981693267822, -0.00010347366333007812, -7.198750972747803e-05, -4.050135612487793e-05, -9.015202522277832e-06, 2.2470951080322266e-05, 5.395710468292236e-05, 8.544325828552246e-05, 0.00011692941188812256, 0.00014841556549072266, 0.00017990171909332275, 0.00021138787269592285, 0.00024287402629852295, 0.00027436017990112305, 0.00030584633350372314, 0.00033733248710632324, 0.00036881864070892334, 0.00040030479431152344, 0.00043179094791412354, 0.00046327710151672363, 0.0004947632551193237, 0.0005262494087219238, 0.0005577355623245239, 0.000589221715927124, 0.0006207078695297241, 0.0006521940231323242, 0.0006836801767349243, 0.0007151663303375244, 0.0007466524839401245, 0.0007781386375427246, 0.0008096247911453247, 0.0008411109447479248, 0.0008725970983505249, 0.000904083251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 3.0, 11.0, 20.0, 8.0, 20.0, 24.0, 28.0, 38.0, 74.0, 135.0, 383.0, 1536.0, 11829.0, 276534.0, 723367.0, 30615.0, 2799.0, 630.0, 204.0, 89.0, 53.0, 35.0, 24.0, 14.0, 14.0, 13.0, 10.0, 8.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.049560546875, -4.87646484375, -4.703369140625, -4.5302734375, -4.357177734375, -4.18408203125, -4.010986328125, -3.837890625, -3.664794921875, -3.49169921875, -3.318603515625, -3.1455078125, -2.972412109375, -2.79931640625, -2.626220703125, -2.453125, -2.280029296875, -2.10693359375, -1.933837890625, -1.7607421875, -1.587646484375, -1.41455078125, -1.241455078125, -1.068359375, -0.895263671875, -0.72216796875, -0.549072265625, -0.3759765625, -0.202880859375, -0.02978515625, 0.143310546875, 0.31640625, 0.489501953125, 0.66259765625, 0.835693359375, 1.0087890625, 1.181884765625, 1.35498046875, 1.528076171875, 1.701171875, 1.874267578125, 2.04736328125, 2.220458984375, 2.3935546875, 2.566650390625, 2.73974609375, 2.912841796875, 3.0859375, 3.259033203125, 3.43212890625, 3.605224609375, 3.7783203125, 3.951416015625, 4.12451171875, 4.297607421875, 4.470703125, 4.643798828125, 4.81689453125, 4.989990234375, 5.1630859375, 5.336181640625, 5.50927734375, 5.682373046875, 5.85546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 12.0, 14.0, 16.0, 17.0, 33.0, 42.0, 53.0, 77.0, 101.0, 102.0, 89.0, 105.0, 70.0, 71.0, 54.0, 34.0, 29.0, 23.0, 18.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90966796875, -0.8845901489257812, -0.8595123291015625, -0.8344345092773438, -0.809356689453125, -0.7842788696289062, -0.7592010498046875, -0.7341232299804688, -0.70904541015625, -0.6839675903320312, -0.6588897705078125, -0.6338119506835938, -0.608734130859375, -0.5836563110351562, -0.5585784912109375, -0.5335006713867188, -0.5084228515625, -0.48334503173828125, -0.4582672119140625, -0.43318939208984375, -0.408111572265625, -0.38303375244140625, -0.3579559326171875, -0.33287811279296875, -0.30780029296875, -0.28272247314453125, -0.2576446533203125, -0.23256683349609375, -0.207489013671875, -0.18241119384765625, -0.1573333740234375, -0.13225555419921875, -0.107177734375, -0.08209991455078125, -0.0570220947265625, -0.03194427490234375, -0.006866455078125, 0.01821136474609375, 0.0432891845703125, 0.06836700439453125, 0.09344482421875, 0.11852264404296875, 0.1436004638671875, 0.16867828369140625, 0.193756103515625, 0.21883392333984375, 0.2439117431640625, 0.26898956298828125, 0.2940673828125, 0.31914520263671875, 0.3442230224609375, 0.36930084228515625, 0.394378662109375, 0.41945648193359375, 0.4445343017578125, 0.46961212158203125, 0.49468994140625, 0.5197677612304688, 0.5448455810546875, 0.5699234008789062, 0.595001220703125, 0.6200790405273438, 0.6451568603515625, 0.6702346801757812, 0.6953125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 21.0, 20.0, 37.0, 52.0, 62.0, 86.0, 106.0, 132.0, 116.0, 108.0, 77.0, 53.0, 45.0, 23.0, 15.0, 12.0, 8.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.724215507507324, -11.343389511108398, -10.962564468383789, -10.58173942565918, -10.200913429260254, -9.820087432861328, -9.439262390136719, -9.05843734741211, -8.677611351013184, -8.296785354614258, -7.915960311889648, -7.535134792327881, -7.154309272766113, -6.773483753204346, -6.392658233642578, -6.0118327140808105, -5.631007194519043, -5.250181674957275, -4.869356155395508, -4.48853063583374, -4.107705116271973, -3.726879596710205, -3.3460540771484375, -2.96522855758667, -2.5844030380249023, -2.2035775184631348, -1.8227519989013672, -1.4419264793395996, -1.061100959777832, -0.6802754402160645, -0.2994499206542969, 0.0813755989074707, 0.4622011184692383, 0.8430266380310059, 1.2238521575927734, 1.604677677154541, 1.9855031967163086, 2.366328716278076, 2.7471542358398438, 3.1279797554016113, 3.508805274963379, 3.8896307945251465, 4.270456314086914, 4.651281833648682, 5.032107353210449, 5.412932872772217, 5.793758392333984, 6.174583911895752, 6.5554094314575195, 6.936234951019287, 7.317060470581055, 7.697885990142822, 8.07871150970459, 8.459537506103516, 8.840362548828125, 9.221187591552734, 9.60201358795166, 9.982839584350586, 10.363664627075195, 10.744489669799805, 11.12531566619873, 11.506141662597656, 11.886966705322266, 12.267791748046875, 12.6486177444458]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 11.0, 16.0, 22.0, 25.0, 27.0, 32.0, 21.0, 42.0, 50.0, 38.0, 57.0, 47.0, 43.0, 46.0, 48.0, 54.0, 48.0, 31.0, 43.0, 43.0, 30.0, 20.0, 25.0, 22.0, 26.0, 16.0, 26.0, 20.0, 9.0, 5.0, 7.0, 3.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.660863399505615, -6.4587483406066895, -6.2566328048706055, -6.05451774597168, -5.852402687072754, -5.650287628173828, -5.448172569274902, -5.246057033538818, -5.043941974639893, -4.841826915740967, -4.639711380004883, -4.437596321105957, -4.235481262207031, -4.0333662033081055, -3.8312509059906006, -3.6291356086730957, -3.42702054977417, -3.224905490875244, -3.0227901935577393, -2.8206748962402344, -2.6185598373413086, -2.416444778442383, -2.214329481124878, -2.012214183807373, -1.8100991249084473, -1.607983946800232, -1.4058687686920166, -1.2037535905838013, -1.001638412475586, -0.7995232343673706, -0.5974080562591553, -0.39529287815093994, -0.1931777000427246, 0.008937478065490723, 0.21105265617370605, 0.4131678342819214, 0.6152830123901367, 0.817398190498352, 1.0195133686065674, 1.2216285467147827, 1.423743724822998, 1.6258589029312134, 1.8279740810394287, 2.0300893783569336, 2.2322044372558594, 2.434319496154785, 2.63643479347229, 2.838550090789795, 3.0406651496887207, 3.2427802085876465, 3.4448955059051514, 3.6470108032226562, 3.849125862121582, 4.051240921020508, 4.253355979919434, 4.455471515655518, 4.657586574554443, 4.859701633453369, 5.061817169189453, 5.263932228088379, 5.466047286987305, 5.6681623458862305, 5.870277404785156, 6.07239294052124, 6.274507999420166]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 6.0, 8.0, 28.0, 39.0, 68.0, 148.0, 288.0, 552.0, 1060.0, 2181.0, 4716.0, 10863.0, 27660.0, 80539.0, 304231.0, 433970.0, 117962.0, 38281.0, 14468.0, 6153.0, 2650.0, 1327.0, 653.0, 306.0, 165.0, 96.0, 51.0, 32.0, 18.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.109375, -5.92510986328125, -5.7408447265625, -5.55657958984375, -5.372314453125, -5.18804931640625, -5.0037841796875, -4.81951904296875, -4.63525390625, -4.45098876953125, -4.2667236328125, -4.08245849609375, -3.898193359375, -3.71392822265625, -3.5296630859375, -3.34539794921875, -3.1611328125, -2.97686767578125, -2.7926025390625, -2.60833740234375, -2.424072265625, -2.23980712890625, -2.0555419921875, -1.87127685546875, -1.68701171875, -1.50274658203125, -1.3184814453125, -1.13421630859375, -0.949951171875, -0.76568603515625, -0.5814208984375, -0.39715576171875, -0.212890625, -0.02862548828125, 0.1556396484375, 0.33990478515625, 0.524169921875, 0.70843505859375, 0.8927001953125, 1.07696533203125, 1.26123046875, 1.44549560546875, 1.6297607421875, 1.81402587890625, 1.998291015625, 2.18255615234375, 2.3668212890625, 2.55108642578125, 2.7353515625, 2.91961669921875, 3.1038818359375, 3.28814697265625, 3.472412109375, 3.65667724609375, 3.8409423828125, 4.02520751953125, 4.20947265625, 4.39373779296875, 4.5780029296875, 4.76226806640625, 4.946533203125, 5.13079833984375, 5.3150634765625, 5.49932861328125, 5.68359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 11.0, 3.0, 10.0, 8.0, 6.0, 18.0, 18.0, 14.0, 19.0, 20.0, 23.0, 33.0, 27.0, 43.0, 27.0, 39.0, 49.0, 38.0, 47.0, 48.0, 57.0, 46.0, 50.0, 41.0, 38.0, 29.0, 28.0, 34.0, 29.0, 14.0, 28.0, 27.0, 22.0, 12.0, 11.0, 6.0, 4.0, 7.0, 3.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-21.515625, -20.946044921875, -20.37646484375, -19.806884765625, -19.2373046875, -18.667724609375, -18.09814453125, -17.528564453125, -16.958984375, -16.389404296875, -15.81982421875, -15.250244140625, -14.6806640625, -14.111083984375, -13.54150390625, -12.971923828125, -12.40234375, -11.832763671875, -11.26318359375, -10.693603515625, -10.1240234375, -9.554443359375, -8.98486328125, -8.415283203125, -7.845703125, -7.276123046875, -6.70654296875, -6.136962890625, -5.5673828125, -4.997802734375, -4.42822265625, -3.858642578125, -3.2890625, -2.719482421875, -2.14990234375, -1.580322265625, -1.0107421875, -0.441162109375, 0.12841796875, 0.697998046875, 1.267578125, 1.837158203125, 2.40673828125, 2.976318359375, 3.5458984375, 4.115478515625, 4.68505859375, 5.254638671875, 5.82421875, 6.393798828125, 6.96337890625, 7.532958984375, 8.1025390625, 8.672119140625, 9.24169921875, 9.811279296875, 10.380859375, 10.950439453125, 11.52001953125, 12.089599609375, 12.6591796875, 13.228759765625, 13.79833984375, 14.367919921875, 14.9375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 7.0, 5.0, 11.0, 9.0, 16.0, 26.0, 26.0, 24.0, 29.0, 23.0, 39.0, 61.0, 80.0, 98.0, 149.0, 585.0, 1031426.0, 15200.0, 251.0, 118.0, 73.0, 62.0, 42.0, 33.0, 24.0, 26.0, 23.0, 18.0, 8.0, 9.0, 6.0, 8.0, 7.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.4375, -65.24609375, -63.0546875, -60.86328125, -58.671875, -56.48046875, -54.2890625, -52.09765625, -49.90625, -47.71484375, -45.5234375, -43.33203125, -41.140625, -38.94921875, -36.7578125, -34.56640625, -32.375, -30.18359375, -27.9921875, -25.80078125, -23.609375, -21.41796875, -19.2265625, -17.03515625, -14.84375, -12.65234375, -10.4609375, -8.26953125, -6.078125, -3.88671875, -1.6953125, 0.49609375, 2.6875, 4.87890625, 7.0703125, 9.26171875, 11.453125, 13.64453125, 15.8359375, 18.02734375, 20.21875, 22.41015625, 24.6015625, 26.79296875, 28.984375, 31.17578125, 33.3671875, 35.55859375, 37.75, 39.94140625, 42.1328125, 44.32421875, 46.515625, 48.70703125, 50.8984375, 53.08984375, 55.28125, 57.47265625, 59.6640625, 61.85546875, 64.046875, 66.23828125, 68.4296875, 70.62109375, 72.8125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 4.0, 5.0, 8.0, 2.0, 13.0, 7.0, 21.0, 23.0, 23.0, 27.0, 26.0, 28.0, 30.0, 53.0, 59.0, 61.0, 55.0, 52.0, 60.0, 41.0, 56.0, 38.0, 50.0, 40.0, 32.0, 28.0, 29.0, 26.0, 22.0, 20.0, 8.0, 8.0, 6.0, 7.0, 9.0, 8.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.390625, -21.66552734375, -20.9404296875, -20.21533203125, -19.490234375, -18.76513671875, -18.0400390625, -17.31494140625, -16.58984375, -15.86474609375, -15.1396484375, -14.41455078125, -13.689453125, -12.96435546875, -12.2392578125, -11.51416015625, -10.7890625, -10.06396484375, -9.3388671875, -8.61376953125, -7.888671875, -7.16357421875, -6.4384765625, -5.71337890625, -4.98828125, -4.26318359375, -3.5380859375, -2.81298828125, -2.087890625, -1.36279296875, -0.6376953125, 0.08740234375, 0.8125, 1.53759765625, 2.2626953125, 2.98779296875, 3.712890625, 4.43798828125, 5.1630859375, 5.88818359375, 6.61328125, 7.33837890625, 8.0634765625, 8.78857421875, 9.513671875, 10.23876953125, 10.9638671875, 11.68896484375, 12.4140625, 13.13916015625, 13.8642578125, 14.58935546875, 15.314453125, 16.03955078125, 16.7646484375, 17.48974609375, 18.21484375, 18.93994140625, 19.6650390625, 20.39013671875, 21.115234375, 21.84033203125, 22.5654296875, 23.29052734375, 24.015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 3.0, 8.0, 7.0, 12.0, 15.0, 27.0, 33.0, 82.0, 173.0, 533.0, 1941.0, 13494.0, 827447.0, 194927.0, 7766.0, 1332.0, 399.0, 152.0, 71.0, 29.0, 18.0, 14.0, 15.0, 8.0, 14.0, 8.0, 1.0, 6.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.88671875, -7.6468505859375, -7.406982421875, -7.1671142578125, -6.92724609375, -6.6873779296875, -6.447509765625, -6.2076416015625, -5.9677734375, -5.7279052734375, -5.488037109375, -5.2481689453125, -5.00830078125, -4.7684326171875, -4.528564453125, -4.2886962890625, -4.048828125, -3.8089599609375, -3.569091796875, -3.3292236328125, -3.08935546875, -2.8494873046875, -2.609619140625, -2.3697509765625, -2.1298828125, -1.8900146484375, -1.650146484375, -1.4102783203125, -1.17041015625, -0.9305419921875, -0.690673828125, -0.4508056640625, -0.2109375, 0.0289306640625, 0.268798828125, 0.5086669921875, 0.74853515625, 0.9884033203125, 1.228271484375, 1.4681396484375, 1.7080078125, 1.9478759765625, 2.187744140625, 2.4276123046875, 2.66748046875, 2.9073486328125, 3.147216796875, 3.3870849609375, 3.626953125, 3.8668212890625, 4.106689453125, 4.3465576171875, 4.58642578125, 4.8262939453125, 5.066162109375, 5.3060302734375, 5.5458984375, 5.7857666015625, 6.025634765625, 6.2655029296875, 6.50537109375, 6.7452392578125, 6.985107421875, 7.2249755859375, 7.46484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 4.0, 8.0, 11.0, 22.0, 36.0, 60.0, 96.0, 241.0, 219.0, 118.0, 57.0, 40.0, 24.0, 15.0, 14.0, 6.0, 3.0, 11.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000522613525390625, -0.0005025789141654968, -0.00048254430294036865, -0.0004625096917152405, -0.0004424750804901123, -0.00042244046926498413, -0.00040240585803985596, -0.0003823712468147278, -0.0003623366355895996, -0.00034230202436447144, -0.00032226741313934326, -0.0003022328019142151, -0.0002821981906890869, -0.00026216357946395874, -0.00024212896823883057, -0.0002220943570137024, -0.00020205974578857422, -0.00018202513456344604, -0.00016199052333831787, -0.0001419559121131897, -0.00012192130088806152, -0.00010188668966293335, -8.185207843780518e-05, -6.1817467212677e-05, -4.178285598754883e-05, -2.1748244762420654e-05, -1.7136335372924805e-06, 1.8320977687835693e-05, 3.835558891296387e-05, 5.839020013809204e-05, 7.842481136322021e-05, 9.845942258834839e-05, 0.00011849403381347656, 0.00013852864503860474, 0.0001585632562637329, 0.00017859786748886108, 0.00019863247871398926, 0.00021866708993911743, 0.0002387017011642456, 0.0002587363123893738, 0.00027877092361450195, 0.0002988055348396301, 0.0003188401460647583, 0.0003388747572898865, 0.00035890936851501465, 0.0003789439797401428, 0.000398978590965271, 0.00041901320219039917, 0.00043904781341552734, 0.0004590824246406555, 0.0004791170358657837, 0.0004991516470909119, 0.00051918625831604, 0.0005392208695411682, 0.0005592554807662964, 0.0005792900919914246, 0.0005993247032165527, 0.0006193593144416809, 0.0006393939256668091, 0.0006594285368919373, 0.0006794631481170654, 0.0006994977593421936, 0.0007195323705673218, 0.00073956698179245, 0.0007596015930175781]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 3.0, 11.0, 18.0, 27.0, 42.0, 77.0, 133.0, 378.0, 1425.0, 6823.0, 85709.0, 920048.0, 28552.0, 3791.0, 943.0, 249.0, 131.0, 67.0, 35.0, 21.0, 19.0, 13.0, 5.0, 4.0, 2.0, 2.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.73828125, -7.5252685546875, -7.312255859375, -7.0992431640625, -6.88623046875, -6.6732177734375, -6.460205078125, -6.2471923828125, -6.0341796875, -5.8211669921875, -5.608154296875, -5.3951416015625, -5.18212890625, -4.9691162109375, -4.756103515625, -4.5430908203125, -4.330078125, -4.1170654296875, -3.904052734375, -3.6910400390625, -3.47802734375, -3.2650146484375, -3.052001953125, -2.8389892578125, -2.6259765625, -2.4129638671875, -2.199951171875, -1.9869384765625, -1.77392578125, -1.5609130859375, -1.347900390625, -1.1348876953125, -0.921875, -0.7088623046875, -0.495849609375, -0.2828369140625, -0.06982421875, 0.1431884765625, 0.356201171875, 0.5692138671875, 0.7822265625, 0.9952392578125, 1.208251953125, 1.4212646484375, 1.63427734375, 1.8472900390625, 2.060302734375, 2.2733154296875, 2.486328125, 2.6993408203125, 2.912353515625, 3.1253662109375, 3.33837890625, 3.5513916015625, 3.764404296875, 3.9774169921875, 4.1904296875, 4.4034423828125, 4.616455078125, 4.8294677734375, 5.04248046875, 5.2554931640625, 5.468505859375, 5.6815185546875, 5.89453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 7.0, 3.0, 16.0, 19.0, 23.0, 35.0, 51.0, 97.0, 211.0, 253.0, 87.0, 55.0, 39.0, 27.0, 18.0, 9.0, 15.0, 4.0, 2.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0134429931640625, -0.965362548828125, -0.9172821044921875, -0.86920166015625, -0.8211212158203125, -0.773040771484375, -0.7249603271484375, -0.6768798828125, -0.6287994384765625, -0.580718994140625, -0.5326385498046875, -0.48455810546875, -0.4364776611328125, -0.388397216796875, -0.3403167724609375, -0.292236328125, -0.2441558837890625, -0.196075439453125, -0.1479949951171875, -0.09991455078125, -0.0518341064453125, -0.003753662109375, 0.0443267822265625, 0.0924072265625, 0.1404876708984375, 0.188568115234375, 0.2366485595703125, 0.28472900390625, 0.3328094482421875, 0.380889892578125, 0.4289703369140625, 0.47705078125, 0.5251312255859375, 0.573211669921875, 0.6212921142578125, 0.66937255859375, 0.7174530029296875, 0.765533447265625, 0.8136138916015625, 0.8616943359375, 0.9097747802734375, 0.957855224609375, 1.0059356689453125, 1.05401611328125, 1.1020965576171875, 1.150177001953125, 1.1982574462890625, 1.246337890625, 1.2944183349609375, 1.342498779296875, 1.3905792236328125, 1.43865966796875, 1.4867401123046875, 1.534820556640625, 1.5829010009765625, 1.6309814453125, 1.6790618896484375, 1.727142333984375, 1.7752227783203125, 1.82330322265625, 1.8713836669921875, 1.919464111328125, 1.9675445556640625, 2.015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 19.0, 43.0, 90.0, 148.0, 220.0, 224.0, 133.0, 71.0, 30.0, 16.0, 6.0, 9.0, 1.0, 2.0, 0.0, 2.0], "bins": [-75.38662719726562, -73.96429443359375, -72.54196166992188, -71.11962890625, -69.69729614257812, -68.27496337890625, -66.85263061523438, -65.43029022216797, -64.0079574584961, -62.58562469482422, -61.163291931152344, -59.74095916748047, -58.31862258911133, -56.89628982543945, -55.47395706176758, -54.0516242980957, -52.62929153442383, -51.20695877075195, -49.78462600708008, -48.36228942871094, -46.93995666503906, -45.51762390136719, -44.09529113769531, -42.67295837402344, -41.25062561035156, -39.82829284667969, -38.40596008300781, -36.98362731933594, -35.5612907409668, -34.13895797729492, -32.71662521362305, -31.294292449951172, -29.871959686279297, -28.449626922607422, -27.027292251586914, -25.60495948791504, -24.18262481689453, -22.760292053222656, -21.33795928955078, -19.915626525878906, -18.4932918548584, -17.070959091186523, -15.648624420166016, -14.22629165649414, -12.80395793914795, -11.381624221801758, -9.959291458129883, -8.536957740783691, -7.1146240234375, -5.692290306091309, -4.269957065582275, -2.847623825073242, -1.4252901077270508, -0.002956390380859375, 1.4193763732910156, 2.841710090637207, 4.264043807983398, 5.68637752532959, 7.108710765838623, 8.531044006347656, 9.953377723693848, 11.375711441040039, 12.798044204711914, 14.220377922058105, 15.642711639404297]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 9.0, 3.0, 7.0, 11.0, 6.0, 11.0, 15.0, 14.0, 16.0, 17.0, 27.0, 24.0, 29.0, 25.0, 34.0, 27.0, 36.0, 33.0, 44.0, 38.0, 40.0, 31.0, 43.0, 31.0, 42.0, 35.0, 35.0, 35.0, 35.0, 29.0, 25.0, 25.0, 23.0, 17.0, 23.0, 17.0, 12.0, 9.0, 10.0, 12.0, 8.0, 9.0, 9.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.943883895874023, -20.214523315429688, -19.485164642333984, -18.75580406188965, -18.026443481445312, -17.29708480834961, -16.567724227905273, -15.838364601135254, -15.109004974365234, -14.379645347595215, -13.650285720825195, -12.92092514038086, -12.19156551361084, -11.46220588684082, -10.732845306396484, -10.003485679626465, -9.274126052856445, -8.544766426086426, -7.815406322479248, -7.08604621887207, -6.356686592102051, -5.627326965332031, -4.8979668617248535, -4.168606758117676, -3.4392471313476562, -2.7098872661590576, -1.980527400970459, -1.2511675357818604, -0.5218076705932617, 0.20755219459533691, 0.9369120597839355, 1.6662721633911133, 2.3956336975097656, 3.1249935626983643, 3.854353427886963, 4.583713531494141, 5.31307315826416, 6.04243278503418, 6.771792888641357, 7.501152992248535, 8.230512619018555, 8.959872245788574, 9.689231872558594, 10.41859245300293, 11.14795207977295, 11.877311706542969, 12.606672286987305, 13.336031913757324, 14.065391540527344, 14.794751167297363, 15.524110794067383, 16.25347137451172, 16.982830047607422, 17.712190628051758, 18.441551208496094, 19.170909881591797, 19.900270462036133, 20.62963104248047, 21.358989715576172, 22.088350296020508, 22.817710876464844, 23.547069549560547, 24.276430130004883, 25.00579071044922, 25.735149383544922]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 9.0, 6.0, 3.0, 8.0, 10.0, 11.0, 24.0, 21.0, 14.0, 38.0, 27.0, 45.0, 54.0, 71.0, 140.0, 231.0, 420.0, 848.0, 1801.0, 4504.0, 13468.0, 58380.0, 604054.0, 2936426.0, 502589.0, 51062.0, 12123.0, 4202.0, 1735.0, 821.0, 448.0, 211.0, 142.0, 85.0, 66.0, 34.0, 35.0, 26.0, 11.0, 16.0, 12.0, 13.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 2.0], "bins": [-16.484375, -16.006103515625, -15.52783203125, -15.049560546875, -14.5712890625, -14.093017578125, -13.61474609375, -13.136474609375, -12.658203125, -12.179931640625, -11.70166015625, -11.223388671875, -10.7451171875, -10.266845703125, -9.78857421875, -9.310302734375, -8.83203125, -8.353759765625, -7.87548828125, -7.397216796875, -6.9189453125, -6.440673828125, -5.96240234375, -5.484130859375, -5.005859375, -4.527587890625, -4.04931640625, -3.571044921875, -3.0927734375, -2.614501953125, -2.13623046875, -1.657958984375, -1.1796875, -0.701416015625, -0.22314453125, 0.255126953125, 0.7333984375, 1.211669921875, 1.68994140625, 2.168212890625, 2.646484375, 3.124755859375, 3.60302734375, 4.081298828125, 4.5595703125, 5.037841796875, 5.51611328125, 5.994384765625, 6.47265625, 6.950927734375, 7.42919921875, 7.907470703125, 8.3857421875, 8.864013671875, 9.34228515625, 9.820556640625, 10.298828125, 10.777099609375, 11.25537109375, 11.733642578125, 12.2119140625, 12.690185546875, 13.16845703125, 13.646728515625, 14.125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 10.0, 6.0, 10.0, 11.0, 17.0, 23.0, 30.0, 28.0, 23.0, 35.0, 48.0, 57.0, 48.0, 57.0, 51.0, 51.0, 55.0, 58.0, 49.0, 35.0, 37.0, 30.0, 44.0, 27.0, 32.0, 23.0, 18.0, 16.0, 13.0, 16.0, 6.0, 7.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.554443359375, -6.31201171875, -6.069580078125, -5.8271484375, -5.584716796875, -5.34228515625, -5.099853515625, -4.857421875, -4.614990234375, -4.37255859375, -4.130126953125, -3.8876953125, -3.645263671875, -3.40283203125, -3.160400390625, -2.91796875, -2.675537109375, -2.43310546875, -2.190673828125, -1.9482421875, -1.705810546875, -1.46337890625, -1.220947265625, -0.978515625, -0.736083984375, -0.49365234375, -0.251220703125, -0.0087890625, 0.233642578125, 0.47607421875, 0.718505859375, 0.9609375, 1.203369140625, 1.44580078125, 1.688232421875, 1.9306640625, 2.173095703125, 2.41552734375, 2.657958984375, 2.900390625, 3.142822265625, 3.38525390625, 3.627685546875, 3.8701171875, 4.112548828125, 4.35498046875, 4.597412109375, 4.83984375, 5.082275390625, 5.32470703125, 5.567138671875, 5.8095703125, 6.052001953125, 6.29443359375, 6.536865234375, 6.779296875, 7.021728515625, 7.26416015625, 7.506591796875, 7.7490234375, 7.991455078125, 8.23388671875, 8.476318359375, 8.71875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 17.0, 24.0, 33.0, 70.0, 186.0, 646.0, 14710.0, 4169045.0, 8597.0, 568.0, 186.0, 69.0, 25.0, 21.0, 13.0, 12.0, 6.0, 6.0, 4.0, 0.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-83.8125, -81.3798828125, -78.947265625, -76.5146484375, -74.08203125, -71.6494140625, -69.216796875, -66.7841796875, -64.3515625, -61.9189453125, -59.486328125, -57.0537109375, -54.62109375, -52.1884765625, -49.755859375, -47.3232421875, -44.890625, -42.4580078125, -40.025390625, -37.5927734375, -35.16015625, -32.7275390625, -30.294921875, -27.8623046875, -25.4296875, -22.9970703125, -20.564453125, -18.1318359375, -15.69921875, -13.2666015625, -10.833984375, -8.4013671875, -5.96875, -3.5361328125, -1.103515625, 1.3291015625, 3.76171875, 6.1943359375, 8.626953125, 11.0595703125, 13.4921875, 15.9248046875, 18.357421875, 20.7900390625, 23.22265625, 25.6552734375, 28.087890625, 30.5205078125, 32.953125, 35.3857421875, 37.818359375, 40.2509765625, 42.68359375, 45.1162109375, 47.548828125, 49.9814453125, 52.4140625, 54.8466796875, 57.279296875, 59.7119140625, 62.14453125, 64.5771484375, 67.009765625, 69.4423828125, 71.875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 13.0, 10.0, 15.0, 25.0, 57.0, 39.0, 88.0, 118.0, 182.0, 321.0, 562.0, 815.0, 719.0, 396.0, 238.0, 139.0, 107.0, 50.0, 58.0, 31.0, 28.0, 17.0, 9.0, 3.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.2515869140625, -4.108642578125, -3.9656982421875, -3.82275390625, -3.6798095703125, -3.536865234375, -3.3939208984375, -3.2509765625, -3.1080322265625, -2.965087890625, -2.8221435546875, -2.67919921875, -2.5362548828125, -2.393310546875, -2.2503662109375, -2.107421875, -1.9644775390625, -1.821533203125, -1.6785888671875, -1.53564453125, -1.3927001953125, -1.249755859375, -1.1068115234375, -0.9638671875, -0.8209228515625, -0.677978515625, -0.5350341796875, -0.39208984375, -0.2491455078125, -0.106201171875, 0.0367431640625, 0.1796875, 0.3226318359375, 0.465576171875, 0.6085205078125, 0.75146484375, 0.8944091796875, 1.037353515625, 1.1802978515625, 1.3232421875, 1.4661865234375, 1.609130859375, 1.7520751953125, 1.89501953125, 2.0379638671875, 2.180908203125, 2.3238525390625, 2.466796875, 2.6097412109375, 2.752685546875, 2.8956298828125, 3.03857421875, 3.1815185546875, 3.324462890625, 3.4674072265625, 3.6103515625, 3.7532958984375, 3.896240234375, 4.0391845703125, 4.18212890625, 4.3250732421875, 4.468017578125, 4.6109619140625, 4.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 15.0, 23.0, 23.0, 24.0, 49.0, 42.0, 51.0, 65.0, 87.0, 93.0, 80.0, 79.0, 77.0, 55.0, 54.0, 39.0, 26.0, 17.0, 23.0, 17.0, 11.0, 13.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.073370933532715, -7.675901412963867, -7.2784318923950195, -6.880961894989014, -6.483492374420166, -6.086022853851318, -5.6885528564453125, -5.291083335876465, -4.893613815307617, -4.4961442947387695, -4.098674774169922, -3.701204776763916, -3.3037352561950684, -2.9062657356262207, -2.508795976638794, -2.111326217651367, -1.7138566970825195, -1.3163870573043823, -0.9189174175262451, -0.5214477777481079, -0.1239781379699707, 0.2734915018081665, 0.6709611415863037, 1.0684309005737305, 1.4659004211425781, 1.8633700609207153, 2.2608397006988525, 2.6583094596862793, 3.055778980255127, 3.4532485008239746, 3.8507182598114014, 4.248188018798828, 4.645656585693359, 5.043126106262207, 5.440595626831055, 5.8380656242370605, 6.235535144805908, 6.633004665374756, 7.030474662780762, 7.427944183349609, 7.825413703918457, 8.222883224487305, 8.620352745056152, 9.017822265625, 9.415292739868164, 9.812762260437012, 10.21023178100586, 10.607701301574707, 11.005170822143555, 11.402640342712402, 11.80010986328125, 12.197579383850098, 12.595048904418945, 12.99251937866211, 13.389988899230957, 13.787458419799805, 14.184927940368652, 14.5823974609375, 14.979866981506348, 15.377336502075195, 15.77480697631836, 16.17227554321289, 16.569746017456055, 16.96721649169922, 17.36468505859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 4.0, 7.0, 9.0, 12.0, 12.0, 11.0, 13.0, 27.0, 30.0, 24.0, 32.0, 31.0, 48.0, 51.0, 37.0, 53.0, 51.0, 47.0, 45.0, 53.0, 43.0, 37.0, 40.0, 45.0, 32.0, 28.0, 21.0, 29.0, 25.0, 20.0, 10.0, 12.0, 15.0, 5.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.543779373168945, -9.275174140930176, -9.00656795501709, -8.73796272277832, -8.469356536865234, -8.200751304626465, -7.932145595550537, -7.663539886474609, -7.394934177398682, -7.126328468322754, -6.857722759246826, -6.589117050170898, -6.320511817932129, -6.051905632019043, -5.783300399780273, -5.514694690704346, -5.246088981628418, -4.97748327255249, -4.7088775634765625, -4.440271854400635, -4.171666145324707, -3.9030606746673584, -3.6344552040100098, -3.365849494934082, -3.0972437858581543, -2.8286380767822266, -2.560032367706299, -2.29142689704895, -2.0228211879730225, -1.7542154788970947, -1.4856098890304565, -1.2170042991638184, -0.9483985900878906, -0.6797929406166077, -0.4111872911453247, -0.14258164167404175, 0.1260240077972412, 0.39462971687316895, 0.6632353067398071, 0.9318408966064453, 1.200446605682373, 1.4690523147583008, 1.737657904624939, 2.006263494491577, 2.274869203567505, 2.5434749126434326, 2.8120803833007812, 3.080686092376709, 3.3492918014526367, 3.6178975105285645, 3.886503219604492, 4.15510892868042, 4.423714637756348, 4.692319869995117, 4.960925579071045, 5.229531288146973, 5.4981369972229, 5.766742706298828, 6.035348415374756, 6.303954124450684, 6.572559356689453, 6.841165542602539, 7.109770774841309, 7.378376483917236, 7.646982192993164]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 6.0, 8.0, 18.0, 33.0, 44.0, 63.0, 132.0, 177.0, 342.0, 672.0, 1211.0, 2879.0, 7302.0, 19405.0, 57460.0, 189373.0, 409608.0, 244149.0, 75370.0, 24311.0, 8977.0, 3651.0, 1627.0, 777.0, 405.0, 215.0, 124.0, 67.0, 41.0, 23.0, 26.0, 12.0, 11.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9453125, -3.80743408203125, -3.6695556640625, -3.53167724609375, -3.393798828125, -3.25592041015625, -3.1180419921875, -2.98016357421875, -2.84228515625, -2.70440673828125, -2.5665283203125, -2.42864990234375, -2.290771484375, -2.15289306640625, -2.0150146484375, -1.87713623046875, -1.7392578125, -1.60137939453125, -1.4635009765625, -1.32562255859375, -1.187744140625, -1.04986572265625, -0.9119873046875, -0.77410888671875, -0.63623046875, -0.49835205078125, -0.3604736328125, -0.22259521484375, -0.084716796875, 0.05316162109375, 0.1910400390625, 0.32891845703125, 0.466796875, 0.60467529296875, 0.7425537109375, 0.88043212890625, 1.018310546875, 1.15618896484375, 1.2940673828125, 1.43194580078125, 1.56982421875, 1.70770263671875, 1.8455810546875, 1.98345947265625, 2.121337890625, 2.25921630859375, 2.3970947265625, 2.53497314453125, 2.6728515625, 2.81072998046875, 2.9486083984375, 3.08648681640625, 3.224365234375, 3.36224365234375, 3.5001220703125, 3.63800048828125, 3.77587890625, 3.91375732421875, 4.0516357421875, 4.18951416015625, 4.327392578125, 4.46527099609375, 4.6031494140625, 4.74102783203125, 4.87890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 11.0, 16.0, 22.0, 28.0, 43.0, 27.0, 33.0, 57.0, 73.0, 67.0, 62.0, 78.0, 71.0, 68.0, 70.0, 56.0, 39.0, 41.0, 31.0, 27.0, 19.0, 10.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-9.5703125, -9.3453369140625, -9.120361328125, -8.8953857421875, -8.67041015625, -8.4454345703125, -8.220458984375, -7.9954833984375, -7.7705078125, -7.5455322265625, -7.320556640625, -7.0955810546875, -6.87060546875, -6.6456298828125, -6.420654296875, -6.1956787109375, -5.970703125, -5.7457275390625, -5.520751953125, -5.2957763671875, -5.07080078125, -4.8458251953125, -4.620849609375, -4.3958740234375, -4.1708984375, -3.9459228515625, -3.720947265625, -3.4959716796875, -3.27099609375, -3.0460205078125, -2.821044921875, -2.5960693359375, -2.37109375, -2.1461181640625, -1.921142578125, -1.6961669921875, -1.47119140625, -1.2462158203125, -1.021240234375, -0.7962646484375, -0.5712890625, -0.3463134765625, -0.121337890625, 0.1036376953125, 0.32861328125, 0.5535888671875, 0.778564453125, 1.0035400390625, 1.228515625, 1.4534912109375, 1.678466796875, 1.9034423828125, 2.12841796875, 2.3533935546875, 2.578369140625, 2.8033447265625, 3.0283203125, 3.2532958984375, 3.478271484375, 3.7032470703125, 3.92822265625, 4.1531982421875, 4.378173828125, 4.6031494140625, 4.828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 10.0, 18.0, 18.0, 36.0, 43.0, 57.0, 97.0, 161.0, 236.0, 440.0, 767.0, 1468.0, 2849.0, 6490.0, 15294.0, 40138.0, 114079.0, 289434.0, 336983.0, 151355.0, 53274.0, 19697.0, 8098.0, 3620.0, 1782.0, 874.0, 437.0, 274.0, 169.0, 115.0, 71.0, 57.0, 29.0, 19.0, 17.0, 10.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.953338623046875, -2.85198974609375, -2.750640869140625, -2.6492919921875, -2.547943115234375, -2.44659423828125, -2.345245361328125, -2.243896484375, -2.142547607421875, -2.04119873046875, -1.939849853515625, -1.8385009765625, -1.737152099609375, -1.63580322265625, -1.534454345703125, -1.43310546875, -1.331756591796875, -1.23040771484375, -1.129058837890625, -1.0277099609375, -0.926361083984375, -0.82501220703125, -0.723663330078125, -0.622314453125, -0.520965576171875, -0.41961669921875, -0.318267822265625, -0.2169189453125, -0.115570068359375, -0.01422119140625, 0.087127685546875, 0.1884765625, 0.289825439453125, 0.39117431640625, 0.492523193359375, 0.5938720703125, 0.695220947265625, 0.79656982421875, 0.897918701171875, 0.999267578125, 1.100616455078125, 1.20196533203125, 1.303314208984375, 1.4046630859375, 1.506011962890625, 1.60736083984375, 1.708709716796875, 1.81005859375, 1.911407470703125, 2.01275634765625, 2.114105224609375, 2.2154541015625, 2.316802978515625, 2.41815185546875, 2.519500732421875, 2.620849609375, 2.722198486328125, 2.82354736328125, 2.924896240234375, 3.0262451171875, 3.127593994140625, 3.22894287109375, 3.330291748046875, 3.431640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 10.0, 16.0, 16.0, 10.0, 20.0, 21.0, 21.0, 22.0, 33.0, 35.0, 35.0, 33.0, 43.0, 46.0, 37.0, 51.0, 47.0, 39.0, 44.0, 35.0, 53.0, 47.0, 54.0, 37.0, 33.0, 25.0, 15.0, 13.0, 18.0, 13.0, 23.0, 14.0, 9.0, 9.0, 5.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3515625, -9.052001953125, -8.75244140625, -8.452880859375, -8.1533203125, -7.853759765625, -7.55419921875, -7.254638671875, -6.955078125, -6.655517578125, -6.35595703125, -6.056396484375, -5.7568359375, -5.457275390625, -5.15771484375, -4.858154296875, -4.55859375, -4.259033203125, -3.95947265625, -3.659912109375, -3.3603515625, -3.060791015625, -2.76123046875, -2.461669921875, -2.162109375, -1.862548828125, -1.56298828125, -1.263427734375, -0.9638671875, -0.664306640625, -0.36474609375, -0.065185546875, 0.234375, 0.533935546875, 0.83349609375, 1.133056640625, 1.4326171875, 1.732177734375, 2.03173828125, 2.331298828125, 2.630859375, 2.930419921875, 3.22998046875, 3.529541015625, 3.8291015625, 4.128662109375, 4.42822265625, 4.727783203125, 5.02734375, 5.326904296875, 5.62646484375, 5.926025390625, 6.2255859375, 6.525146484375, 6.82470703125, 7.124267578125, 7.423828125, 7.723388671875, 8.02294921875, 8.322509765625, 8.6220703125, 8.921630859375, 9.22119140625, 9.520751953125, 9.8203125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 22.0, 24.0, 26.0, 61.0, 84.0, 133.0, 222.0, 360.0, 632.0, 1187.0, 2422.0, 5554.0, 13747.0, 40821.0, 137787.0, 379564.0, 314916.0, 100558.0, 30910.0, 10667.0, 4399.0, 2019.0, 1048.0, 542.0, 308.0, 177.0, 127.0, 58.0, 55.0, 25.0, 17.0, 20.0, 9.0, 14.0, 8.0, 8.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.2393035888671875, -1.196380615234375, -1.1534576416015625, -1.11053466796875, -1.0676116943359375, -1.024688720703125, -0.9817657470703125, -0.9388427734375, -0.8959197998046875, -0.852996826171875, -0.8100738525390625, -0.76715087890625, -0.7242279052734375, -0.681304931640625, -0.6383819580078125, -0.595458984375, -0.5525360107421875, -0.509613037109375, -0.4666900634765625, -0.42376708984375, -0.3808441162109375, -0.337921142578125, -0.2949981689453125, -0.2520751953125, -0.2091522216796875, -0.166229248046875, -0.1233062744140625, -0.08038330078125, -0.0374603271484375, 0.005462646484375, 0.0483856201171875, 0.09130859375, 0.1342315673828125, 0.177154541015625, 0.2200775146484375, 0.26300048828125, 0.3059234619140625, 0.348846435546875, 0.3917694091796875, 0.4346923828125, 0.4776153564453125, 0.520538330078125, 0.5634613037109375, 0.60638427734375, 0.6493072509765625, 0.692230224609375, 0.7351531982421875, 0.778076171875, 0.8209991455078125, 0.863922119140625, 0.9068450927734375, 0.94976806640625, 0.9926910400390625, 1.035614013671875, 1.0785369873046875, 1.1214599609375, 1.1643829345703125, 1.207305908203125, 1.2502288818359375, 1.29315185546875, 1.3360748291015625, 1.378997802734375, 1.4219207763671875, 1.46484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 7.0, 14.0, 17.0, 14.0, 16.0, 25.0, 25.0, 33.0, 48.0, 45.0, 62.0, 62.0, 61.0, 72.0, 55.0, 53.0, 54.0, 49.0, 46.0, 40.0, 29.0, 28.0, 28.0, 17.0, 15.0, 13.0, 13.0, 8.0, 8.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0006613731384277344, -0.000642724335193634, -0.0006240755319595337, -0.0006054267287254333, -0.000586777925491333, -0.0005681291222572327, -0.0005494803190231323, -0.000530831515789032, -0.0005121827125549316, -0.0004935339093208313, -0.00047488510608673096, -0.0004562363028526306, -0.0004375874996185303, -0.00041893869638442993, -0.0004002898931503296, -0.00038164108991622925, -0.0003629922866821289, -0.00034434348344802856, -0.0003256946802139282, -0.0003070458769798279, -0.00028839707374572754, -0.0002697482705116272, -0.00025109946727752686, -0.00023245066404342651, -0.00021380186080932617, -0.00019515305757522583, -0.0001765042543411255, -0.00015785545110702515, -0.0001392066478729248, -0.00012055784463882446, -0.00010190904140472412, -8.326023817062378e-05, -6.461143493652344e-05, -4.5962631702423096e-05, -2.7313828468322754e-05, -8.665025234222412e-06, 9.98377799987793e-06, 2.863258123397827e-05, 4.728138446807861e-05, 6.593018770217896e-05, 8.45789909362793e-05, 0.00010322779417037964, 0.00012187659740447998, 0.00014052540063858032, 0.00015917420387268066, 0.000177823007106781, 0.00019647181034088135, 0.0002151206135749817, 0.00023376941680908203, 0.0002524182200431824, 0.0002710670232772827, 0.00028971582651138306, 0.0003083646297454834, 0.00032701343297958374, 0.0003456622362136841, 0.0003643110394477844, 0.00038295984268188477, 0.0004016086459159851, 0.00042025744915008545, 0.0004389062523841858, 0.00045755505561828613, 0.0004762038588523865, 0.0004948526620864868, 0.0005135014653205872, 0.0005321502685546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 4.0, 2.0, 9.0, 8.0, 12.0, 17.0, 19.0, 27.0, 36.0, 58.0, 104.0, 137.0, 241.0, 389.0, 855.0, 1667.0, 3760.0, 9211.0, 26434.0, 86762.0, 270397.0, 393501.0, 174045.0, 52484.0, 16608.0, 6226.0, 2729.0, 1268.0, 607.0, 369.0, 207.0, 124.0, 64.0, 53.0, 25.0, 28.0, 20.0, 14.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.349609375, -1.3078155517578125, -1.266021728515625, -1.2242279052734375, -1.18243408203125, -1.1406402587890625, -1.098846435546875, -1.0570526123046875, -1.0152587890625, -0.9734649658203125, -0.931671142578125, -0.8898773193359375, -0.84808349609375, -0.8062896728515625, -0.764495849609375, -0.7227020263671875, -0.680908203125, -0.6391143798828125, -0.597320556640625, -0.5555267333984375, -0.51373291015625, -0.4719390869140625, -0.430145263671875, -0.3883514404296875, -0.3465576171875, -0.3047637939453125, -0.262969970703125, -0.2211761474609375, -0.17938232421875, -0.1375885009765625, -0.095794677734375, -0.0540008544921875, -0.01220703125, 0.0295867919921875, 0.071380615234375, 0.1131744384765625, 0.15496826171875, 0.1967620849609375, 0.238555908203125, 0.2803497314453125, 0.3221435546875, 0.3639373779296875, 0.405731201171875, 0.4475250244140625, 0.48931884765625, 0.5311126708984375, 0.572906494140625, 0.6147003173828125, 0.656494140625, 0.6982879638671875, 0.740081787109375, 0.7818756103515625, 0.82366943359375, 0.8654632568359375, 0.907257080078125, 0.9490509033203125, 0.9908447265625, 1.0326385498046875, 1.074432373046875, 1.1162261962890625, 1.15802001953125, 1.1998138427734375, 1.241607666015625, 1.2834014892578125, 1.3251953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 4.0, 5.0, 6.0, 7.0, 6.0, 12.0, 22.0, 12.0, 26.0, 22.0, 27.0, 23.0, 46.0, 27.0, 38.0, 70.0, 52.0, 59.0, 56.0, 57.0, 70.0, 53.0, 54.0, 37.0, 45.0, 26.0, 25.0, 16.0, 24.0, 18.0, 18.0, 8.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.304931640625, -0.2956962585449219, -0.28646087646484375, -0.2772254943847656, -0.2679901123046875, -0.2587547302246094, -0.24951934814453125, -0.24028396606445312, -0.231048583984375, -0.22181320190429688, -0.21257781982421875, -0.20334243774414062, -0.1941070556640625, -0.18487167358398438, -0.17563629150390625, -0.16640090942382812, -0.15716552734375, -0.14793014526367188, -0.13869476318359375, -0.12945938110351562, -0.1202239990234375, -0.11098861694335938, -0.10175323486328125, -0.09251785278320312, -0.083282470703125, -0.07404708862304688, -0.06481170654296875, -0.055576324462890625, -0.0463409423828125, -0.037105560302734375, -0.02787017822265625, -0.018634796142578125, -0.0093994140625, -0.000164031982421875, 0.00907135009765625, 0.018306732177734375, 0.0275421142578125, 0.036777496337890625, 0.04601287841796875, 0.055248260498046875, 0.064483642578125, 0.07371902465820312, 0.08295440673828125, 0.09218978881835938, 0.1014251708984375, 0.11066055297851562, 0.11989593505859375, 0.12913131713867188, 0.13836669921875, 0.14760208129882812, 0.15683746337890625, 0.16607284545898438, 0.1753082275390625, 0.18454360961914062, 0.19377899169921875, 0.20301437377929688, 0.212249755859375, 0.22148513793945312, 0.23072052001953125, 0.23995590209960938, 0.2491912841796875, 0.2584266662597656, 0.26766204833984375, 0.2768974304199219, 0.2861328125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 7.0, 13.0, 20.0, 18.0, 44.0, 58.0, 61.0, 75.0, 95.0, 100.0, 101.0, 78.0, 83.0, 55.0, 45.0, 25.0, 23.0, 24.0, 19.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.933866024017334, -4.675630569458008, -4.417394638061523, -4.159159183502197, -3.900923728942871, -3.642688274383545, -3.3844525814056396, -3.1262168884277344, -2.867981433868408, -2.609745979309082, -2.3515102863311768, -2.0932745933532715, -1.8350391387939453, -1.5768035650253296, -1.3185679912567139, -1.0603324174880981, -0.8020968437194824, -0.5438612699508667, -0.285625696182251, -0.027390122413635254, 0.23084545135498047, 0.4890810251235962, 0.7473165988922119, 1.0055521726608276, 1.2637877464294434, 1.522023320198059, 1.7802588939666748, 2.03849458694458, 2.2967300415039062, 2.5549654960632324, 2.8132011890411377, 3.071436882019043, 3.329671859741211, 3.587907314300537, 3.8461430072784424, 4.104378700256348, 4.362614154815674, 4.620849609375, 4.879085540771484, 5.1373209953308105, 5.395556449890137, 5.653791904449463, 5.912027359008789, 6.170263290405273, 6.4284987449646, 6.686734199523926, 6.94497013092041, 7.203205585479736, 7.4614410400390625, 7.719676494598389, 7.977911949157715, 8.2361478805542, 8.494382858276367, 8.752618789672852, 9.010854721069336, 9.269089698791504, 9.527325630187988, 9.785561561584473, 10.04379653930664, 10.302032470703125, 10.56026840209961, 10.818503379821777, 11.076739311218262, 11.33497428894043, 11.593210220336914]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 3.0, 10.0, 13.0, 18.0, 20.0, 23.0, 36.0, 23.0, 48.0, 38.0, 55.0, 65.0, 53.0, 52.0, 59.0, 56.0, 68.0, 47.0, 49.0, 36.0, 41.0, 41.0, 23.0, 25.0, 16.0, 12.0, 14.0, 12.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.4476823806762695, -6.265778064727783, -6.083873748779297, -5.901969909667969, -5.720065593719482, -5.538161277770996, -5.35625696182251, -5.174352645874023, -4.992448806762695, -4.810544490814209, -4.628640174865723, -4.4467363357543945, -4.264832019805908, -4.082927703857422, -3.9010233879089355, -3.719119071960449, -3.537214756011963, -3.3553104400634766, -3.1734063625335693, -2.991502046585083, -2.809597969055176, -2.6276936531066895, -2.445789337158203, -2.263885021209717, -2.0819809436798096, -1.9000767469406128, -1.718172550201416, -1.5362682342529297, -1.354364037513733, -1.1724598407745361, -0.9905555248260498, -0.808651328086853, -0.626746654510498, -0.4448424279689789, -0.2629382014274597, -0.08103394508361816, 0.10087025165557861, 0.2827744483947754, 0.4646787643432617, 0.6465829610824585, 0.8284871578216553, 1.010391354560852, 1.1922955513000488, 1.3741998672485352, 1.556104063987732, 1.7380082607269287, 1.919912576675415, 2.1018166542053223, 2.2837209701538086, 2.465625286102295, 2.647529363632202, 2.8294336795806885, 3.0113377571105957, 3.193242073059082, 3.3751463890075684, 3.5570507049560547, 3.738954782485962, 3.9208590984344482, 4.1027631759643555, 4.284667491912842, 4.466571807861328, 4.648475646972656, 4.830380439758301, 5.012284278869629, 5.194188594818115]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 15.0, 24.0, 60.0, 76.0, 131.0, 235.0, 498.0, 1079.0, 2551.0, 6874.0, 21585.0, 90725.0, 606178.0, 252253.0, 45816.0, 12694.0, 4393.0, 1764.0, 781.0, 391.0, 183.0, 106.0, 53.0, 24.0, 21.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.265625, -9.013671875, -8.76171875, -8.509765625, -8.2578125, -8.005859375, -7.75390625, -7.501953125, -7.25, -6.998046875, -6.74609375, -6.494140625, -6.2421875, -5.990234375, -5.73828125, -5.486328125, -5.234375, -4.982421875, -4.73046875, -4.478515625, -4.2265625, -3.974609375, -3.72265625, -3.470703125, -3.21875, -2.966796875, -2.71484375, -2.462890625, -2.2109375, -1.958984375, -1.70703125, -1.455078125, -1.203125, -0.951171875, -0.69921875, -0.447265625, -0.1953125, 0.056640625, 0.30859375, 0.560546875, 0.8125, 1.064453125, 1.31640625, 1.568359375, 1.8203125, 2.072265625, 2.32421875, 2.576171875, 2.828125, 3.080078125, 3.33203125, 3.583984375, 3.8359375, 4.087890625, 4.33984375, 4.591796875, 4.84375, 5.095703125, 5.34765625, 5.599609375, 5.8515625, 6.103515625, 6.35546875, 6.607421875, 6.859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 7.0, 12.0, 28.0, 16.0, 26.0, 43.0, 34.0, 43.0, 32.0, 52.0, 56.0, 57.0, 59.0, 61.0, 51.0, 58.0, 45.0, 51.0, 47.0, 35.0, 32.0, 27.0, 14.0, 23.0, 16.0, 11.0, 7.0, 9.0, 3.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.41455078125, -11.0244140625, -10.63427734375, -10.244140625, -9.85400390625, -9.4638671875, -9.07373046875, -8.68359375, -8.29345703125, -7.9033203125, -7.51318359375, -7.123046875, -6.73291015625, -6.3427734375, -5.95263671875, -5.5625, -5.17236328125, -4.7822265625, -4.39208984375, -4.001953125, -3.61181640625, -3.2216796875, -2.83154296875, -2.44140625, -2.05126953125, -1.6611328125, -1.27099609375, -0.880859375, -0.49072265625, -0.1005859375, 0.28955078125, 0.6796875, 1.06982421875, 1.4599609375, 1.85009765625, 2.240234375, 2.63037109375, 3.0205078125, 3.41064453125, 3.80078125, 4.19091796875, 4.5810546875, 4.97119140625, 5.361328125, 5.75146484375, 6.1416015625, 6.53173828125, 6.921875, 7.31201171875, 7.7021484375, 8.09228515625, 8.482421875, 8.87255859375, 9.2626953125, 9.65283203125, 10.04296875, 10.43310546875, 10.8232421875, 11.21337890625, 11.603515625, 11.99365234375, 12.3837890625, 12.77392578125, 13.1640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 9.0, 11.0, 11.0, 17.0, 9.0, 26.0, 33.0, 31.0, 39.0, 49.0, 51.0, 90.0, 363.0, 89971.0, 956387.0, 1014.0, 104.0, 72.0, 51.0, 59.0, 30.0, 30.0, 16.0, 15.0, 18.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -65.54736328125, -63.7822265625, -62.01708984375, -60.251953125, -58.48681640625, -56.7216796875, -54.95654296875, -53.19140625, -51.42626953125, -49.6611328125, -47.89599609375, -46.130859375, -44.36572265625, -42.6005859375, -40.83544921875, -39.0703125, -37.30517578125, -35.5400390625, -33.77490234375, -32.009765625, -30.24462890625, -28.4794921875, -26.71435546875, -24.94921875, -23.18408203125, -21.4189453125, -19.65380859375, -17.888671875, -16.12353515625, -14.3583984375, -12.59326171875, -10.828125, -9.06298828125, -7.2978515625, -5.53271484375, -3.767578125, -2.00244140625, -0.2373046875, 1.52783203125, 3.29296875, 5.05810546875, 6.8232421875, 8.58837890625, 10.353515625, 12.11865234375, 13.8837890625, 15.64892578125, 17.4140625, 19.17919921875, 20.9443359375, 22.70947265625, 24.474609375, 26.23974609375, 28.0048828125, 29.77001953125, 31.53515625, 33.30029296875, 35.0654296875, 36.83056640625, 38.595703125, 40.36083984375, 42.1259765625, 43.89111328125, 45.65625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 12.0, 11.0, 11.0, 17.0, 24.0, 30.0, 45.0, 28.0, 58.0, 51.0, 71.0, 65.0, 59.0, 66.0, 57.0, 50.0, 59.0, 56.0, 58.0, 36.0, 28.0, 25.0, 15.0, 16.0, 14.0, 4.0, 8.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.140625, -19.63818359375, -19.1357421875, -18.63330078125, -18.130859375, -17.62841796875, -17.1259765625, -16.62353515625, -16.12109375, -15.61865234375, -15.1162109375, -14.61376953125, -14.111328125, -13.60888671875, -13.1064453125, -12.60400390625, -12.1015625, -11.59912109375, -11.0966796875, -10.59423828125, -10.091796875, -9.58935546875, -9.0869140625, -8.58447265625, -8.08203125, -7.57958984375, -7.0771484375, -6.57470703125, -6.072265625, -5.56982421875, -5.0673828125, -4.56494140625, -4.0625, -3.56005859375, -3.0576171875, -2.55517578125, -2.052734375, -1.55029296875, -1.0478515625, -0.54541015625, -0.04296875, 0.45947265625, 0.9619140625, 1.46435546875, 1.966796875, 2.46923828125, 2.9716796875, 3.47412109375, 3.9765625, 4.47900390625, 4.9814453125, 5.48388671875, 5.986328125, 6.48876953125, 6.9912109375, 7.49365234375, 7.99609375, 8.49853515625, 9.0009765625, 9.50341796875, 10.005859375, 10.50830078125, 11.0107421875, 11.51318359375, 12.015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 10.0, 11.0, 22.0, 15.0, 26.0, 34.0, 51.0, 67.0, 116.0, 191.0, 361.0, 597.0, 1371.0, 3260.0, 9154.0, 32447.0, 166301.0, 708179.0, 93960.0, 21096.0, 6447.0, 2533.0, 1018.0, 536.0, 281.0, 158.0, 105.0, 64.0, 40.0, 27.0, 14.0, 18.0, 9.0, 6.0, 4.0, 6.0, 7.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.4532470703125, -2.363525390625, -2.2738037109375, -2.18408203125, -2.0943603515625, -2.004638671875, -1.9149169921875, -1.8251953125, -1.7354736328125, -1.645751953125, -1.5560302734375, -1.46630859375, -1.3765869140625, -1.286865234375, -1.1971435546875, -1.107421875, -1.0177001953125, -0.927978515625, -0.8382568359375, -0.74853515625, -0.6588134765625, -0.569091796875, -0.4793701171875, -0.3896484375, -0.2999267578125, -0.210205078125, -0.1204833984375, -0.03076171875, 0.0589599609375, 0.148681640625, 0.2384033203125, 0.328125, 0.4178466796875, 0.507568359375, 0.5972900390625, 0.68701171875, 0.7767333984375, 0.866455078125, 0.9561767578125, 1.0458984375, 1.1356201171875, 1.225341796875, 1.3150634765625, 1.40478515625, 1.4945068359375, 1.584228515625, 1.6739501953125, 1.763671875, 1.8533935546875, 1.943115234375, 2.0328369140625, 2.12255859375, 2.2122802734375, 2.302001953125, 2.3917236328125, 2.4814453125, 2.5711669921875, 2.660888671875, 2.7506103515625, 2.84033203125, 2.9300537109375, 3.019775390625, 3.1094970703125, 3.19921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 13.0, 15.0, 25.0, 20.0, 38.0, 56.0, 100.0, 192.0, 253.0, 94.0, 55.0, 37.0, 33.0, 23.0, 11.0, 7.0, 9.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038909912109375, -0.0003706887364387512, -0.00035227835178375244, -0.00033386796712875366, -0.0003154575824737549, -0.0002970471978187561, -0.0002786368131637573, -0.00026022642850875854, -0.00024181604385375977, -0.00022340565919876099, -0.0002049952745437622, -0.00018658488988876343, -0.00016817450523376465, -0.00014976412057876587, -0.0001313537359237671, -0.00011294335126876831, -9.453296661376953e-05, -7.612258195877075e-05, -5.771219730377197e-05, -3.930181264877319e-05, -2.0891427993774414e-05, -2.4810433387756348e-06, 1.5929341316223145e-05, 3.4339725971221924e-05, 5.27501106262207e-05, 7.116049528121948e-05, 8.957087993621826e-05, 0.00010798126459121704, 0.00012639164924621582, 0.0001448020339012146, 0.00016321241855621338, 0.00018162280321121216, 0.00020003318786621094, 0.00021844357252120972, 0.0002368539571762085, 0.0002552643418312073, 0.00027367472648620605, 0.00029208511114120483, 0.0003104954957962036, 0.0003289058804512024, 0.00034731626510620117, 0.00036572664976119995, 0.00038413703441619873, 0.0004025474190711975, 0.0004209578037261963, 0.00043936818838119507, 0.00045777857303619385, 0.0004761889576911926, 0.0004945993423461914, 0.0005130097270011902, 0.000531420111656189, 0.0005498304963111877, 0.0005682408809661865, 0.0005866512656211853, 0.0006050616502761841, 0.0006234720349311829, 0.0006418824195861816, 0.0006602928042411804, 0.0006787031888961792, 0.000697113573551178, 0.0007155239582061768, 0.0007339343428611755, 0.0007523447275161743, 0.0007707551121711731, 0.0007891654968261719]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 5.0, 4.0, 9.0, 12.0, 12.0, 32.0, 46.0, 82.0, 142.0, 262.0, 486.0, 1034.0, 2343.0, 5939.0, 19098.0, 83532.0, 697340.0, 187381.0, 34492.0, 9709.0, 3538.0, 1506.0, 705.0, 371.0, 187.0, 119.0, 68.0, 33.0, 20.0, 21.0, 11.0, 7.0, 4.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.564971923828125, -2.47564697265625, -2.386322021484375, -2.2969970703125, -2.207672119140625, -2.11834716796875, -2.029022216796875, -1.939697265625, -1.850372314453125, -1.76104736328125, -1.671722412109375, -1.5823974609375, -1.493072509765625, -1.40374755859375, -1.314422607421875, -1.22509765625, -1.135772705078125, -1.04644775390625, -0.957122802734375, -0.8677978515625, -0.778472900390625, -0.68914794921875, -0.599822998046875, -0.510498046875, -0.421173095703125, -0.33184814453125, -0.242523193359375, -0.1531982421875, -0.063873291015625, 0.02545166015625, 0.114776611328125, 0.2041015625, 0.293426513671875, 0.38275146484375, 0.472076416015625, 0.5614013671875, 0.650726318359375, 0.74005126953125, 0.829376220703125, 0.918701171875, 1.008026123046875, 1.09735107421875, 1.186676025390625, 1.2760009765625, 1.365325927734375, 1.45465087890625, 1.543975830078125, 1.63330078125, 1.722625732421875, 1.81195068359375, 1.901275634765625, 1.9906005859375, 2.079925537109375, 2.16925048828125, 2.258575439453125, 2.347900390625, 2.437225341796875, 2.52655029296875, 2.615875244140625, 2.7052001953125, 2.794525146484375, 2.88385009765625, 2.973175048828125, 3.0625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 7.0, 17.0, 15.0, 21.0, 27.0, 38.0, 38.0, 60.0, 80.0, 272.0, 97.0, 57.0, 44.0, 42.0, 29.0, 27.0, 22.0, 25.0, 14.0, 10.0, 9.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71142578125, -0.6751480102539062, -0.6388702392578125, -0.6025924682617188, -0.566314697265625, -0.5300369262695312, -0.4937591552734375, -0.45748138427734375, -0.42120361328125, -0.38492584228515625, -0.3486480712890625, -0.31237030029296875, -0.276092529296875, -0.23981475830078125, -0.2035369873046875, -0.16725921630859375, -0.1309814453125, -0.09470367431640625, -0.0584259033203125, -0.02214813232421875, 0.014129638671875, 0.05040740966796875, 0.0866851806640625, 0.12296295166015625, 0.15924072265625, 0.19551849365234375, 0.2317962646484375, 0.26807403564453125, 0.304351806640625, 0.34062957763671875, 0.3769073486328125, 0.41318511962890625, 0.449462890625, 0.48574066162109375, 0.5220184326171875, 0.5582962036132812, 0.594573974609375, 0.6308517456054688, 0.6671295166015625, 0.7034072875976562, 0.73968505859375, 0.7759628295898438, 0.8122406005859375, 0.8485183715820312, 0.884796142578125, 0.9210739135742188, 0.9573516845703125, 0.9936294555664062, 1.0299072265625, 1.0661849975585938, 1.1024627685546875, 1.1387405395507812, 1.175018310546875, 1.2112960815429688, 1.2475738525390625, 1.2838516235351562, 1.32012939453125, 1.3564071655273438, 1.3926849365234375, 1.4289627075195312, 1.465240478515625, 1.5015182495117188, 1.5377960205078125, 1.5740737915039062, 1.6103515625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 22.0, 99.0, 316.0, 367.0, 147.0, 47.0, 7.0, 7.0, 1.0, 0.0, 1.0], "bins": [-125.51412200927734, -123.28372955322266, -121.05333709716797, -118.82294464111328, -116.59255981445312, -114.36216735839844, -112.13177490234375, -109.90138244628906, -107.67098999023438, -105.44059753417969, -103.210205078125, -100.97981262207031, -98.74942016601562, -96.51903533935547, -94.28864288330078, -92.0582504272461, -89.8278579711914, -87.59746551513672, -85.36707305908203, -83.13668060302734, -80.90629577636719, -78.6759033203125, -76.44551086425781, -74.21511840820312, -71.98472595214844, -69.75433349609375, -67.52394104003906, -65.29354858398438, -63.06315994262695, -60.832767486572266, -58.602378845214844, -56.371986389160156, -54.14158630371094, -51.91119384765625, -49.68080139160156, -47.45041275024414, -45.22002029418945, -42.989627838134766, -40.759239196777344, -38.528846740722656, -36.29845428466797, -34.06806182861328, -31.837671279907227, -29.607280731201172, -27.376888275146484, -25.146495819091797, -22.916105270385742, -20.685714721679688, -18.455324172973633, -16.224933624267578, -13.99454116821289, -11.76414966583252, -9.533758163452148, -7.303366661071777, -5.072975158691406, -2.842583656311035, -0.6121921539306641, 1.618199348449707, 3.848590850830078, 6.078982353210449, 8.30937385559082, 10.539765357971191, 12.770156860351562, 15.000548362731934, 17.230939865112305]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 10.0, 9.0, 10.0, 9.0, 17.0, 14.0, 18.0, 23.0, 22.0, 34.0, 24.0, 38.0, 31.0, 42.0, 46.0, 36.0, 41.0, 43.0, 54.0, 50.0, 44.0, 43.0, 39.0, 47.0, 39.0, 31.0, 37.0, 21.0, 22.0, 23.0, 12.0, 14.0, 15.0, 8.0, 3.0, 9.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.739897727966309, -13.230113983154297, -12.720330238342285, -12.210546493530273, -11.700762748718262, -11.19097900390625, -10.681195259094238, -10.171411514282227, -9.661627769470215, -9.151844024658203, -8.642060279846191, -8.13227653503418, -7.622492790222168, -7.112709045410156, -6.6029253005981445, -6.093141555786133, -5.583357810974121, -5.073574066162109, -4.563790321350098, -4.054006576538086, -3.544222831726074, -3.0344390869140625, -2.524655342102051, -2.014871597290039, -1.5050878524780273, -0.9953041076660156, -0.4855203628540039, 0.024263381958007812, 0.5340471267700195, 1.0438308715820312, 1.553614616394043, 2.0633983612060547, 2.57318115234375, 3.0829648971557617, 3.5927486419677734, 4.102532386779785, 4.612316131591797, 5.122099876403809, 5.63188362121582, 6.141667366027832, 6.651451110839844, 7.1612348556518555, 7.671018600463867, 8.180802345275879, 8.69058609008789, 9.200369834899902, 9.710153579711914, 10.219937324523926, 10.729721069335938, 11.23950481414795, 11.749288558959961, 12.259072303771973, 12.768856048583984, 13.278639793395996, 13.788423538208008, 14.29820728302002, 14.807991027832031, 15.317774772644043, 15.827558517456055, 16.33734130859375, 16.847126007080078, 17.356910705566406, 17.8666934967041, 18.376476287841797, 18.886260986328125]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 10.0, 7.0, 18.0, 20.0, 23.0, 27.0, 70.0, 125.0, 204.0, 399.0, 754.0, 1791.0, 4335.0, 13295.0, 61693.0, 688070.0, 2982350.0, 384360.0, 40644.0, 9716.0, 3384.0, 1424.0, 680.0, 376.0, 192.0, 112.0, 69.0, 29.0, 22.0, 16.0, 23.0, 13.0, 15.0, 4.0, 3.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.364990234375, -12.92529296875, -12.485595703125, -12.0458984375, -11.606201171875, -11.16650390625, -10.726806640625, -10.287109375, -9.847412109375, -9.40771484375, -8.968017578125, -8.5283203125, -8.088623046875, -7.64892578125, -7.209228515625, -6.76953125, -6.329833984375, -5.89013671875, -5.450439453125, -5.0107421875, -4.571044921875, -4.13134765625, -3.691650390625, -3.251953125, -2.812255859375, -2.37255859375, -1.932861328125, -1.4931640625, -1.053466796875, -0.61376953125, -0.174072265625, 0.265625, 0.705322265625, 1.14501953125, 1.584716796875, 2.0244140625, 2.464111328125, 2.90380859375, 3.343505859375, 3.783203125, 4.222900390625, 4.66259765625, 5.102294921875, 5.5419921875, 5.981689453125, 6.42138671875, 6.861083984375, 7.30078125, 7.740478515625, 8.18017578125, 8.619873046875, 9.0595703125, 9.499267578125, 9.93896484375, 10.378662109375, 10.818359375, 11.258056640625, 11.69775390625, 12.137451171875, 12.5771484375, 13.016845703125, 13.45654296875, 13.896240234375, 14.3359375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 7.0, 3.0, 16.0, 16.0, 21.0, 12.0, 30.0, 35.0, 36.0, 34.0, 50.0, 61.0, 63.0, 61.0, 51.0, 58.0, 38.0, 57.0, 46.0, 58.0, 45.0, 30.0, 41.0, 21.0, 16.0, 22.0, 19.0, 9.0, 9.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.12017822265625, -5.8848876953125, -5.64959716796875, -5.414306640625, -5.17901611328125, -4.9437255859375, -4.70843505859375, -4.47314453125, -4.23785400390625, -4.0025634765625, -3.76727294921875, -3.531982421875, -3.29669189453125, -3.0614013671875, -2.82611083984375, -2.5908203125, -2.35552978515625, -2.1202392578125, -1.88494873046875, -1.649658203125, -1.41436767578125, -1.1790771484375, -0.94378662109375, -0.70849609375, -0.47320556640625, -0.2379150390625, -0.00262451171875, 0.232666015625, 0.46795654296875, 0.7032470703125, 0.93853759765625, 1.173828125, 1.40911865234375, 1.6444091796875, 1.87969970703125, 2.114990234375, 2.35028076171875, 2.5855712890625, 2.82086181640625, 3.05615234375, 3.29144287109375, 3.5267333984375, 3.76202392578125, 3.997314453125, 4.23260498046875, 4.4678955078125, 4.70318603515625, 4.9384765625, 5.17376708984375, 5.4090576171875, 5.64434814453125, 5.879638671875, 6.11492919921875, 6.3502197265625, 6.58551025390625, 6.82080078125, 7.05609130859375, 7.2913818359375, 7.52667236328125, 7.761962890625, 7.99725341796875, 8.2325439453125, 8.46783447265625, 8.703125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 14.0, 26.0, 53.0, 108.0, 285.0, 1851.0, 177491.0, 4005482.0, 8052.0, 555.0, 165.0, 64.0, 41.0, 27.0, 12.0, 13.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-50.9375, -49.4912109375, -48.044921875, -46.5986328125, -45.15234375, -43.7060546875, -42.259765625, -40.8134765625, -39.3671875, -37.9208984375, -36.474609375, -35.0283203125, -33.58203125, -32.1357421875, -30.689453125, -29.2431640625, -27.796875, -26.3505859375, -24.904296875, -23.4580078125, -22.01171875, -20.5654296875, -19.119140625, -17.6728515625, -16.2265625, -14.7802734375, -13.333984375, -11.8876953125, -10.44140625, -8.9951171875, -7.548828125, -6.1025390625, -4.65625, -3.2099609375, -1.763671875, -0.3173828125, 1.12890625, 2.5751953125, 4.021484375, 5.4677734375, 6.9140625, 8.3603515625, 9.806640625, 11.2529296875, 12.69921875, 14.1455078125, 15.591796875, 17.0380859375, 18.484375, 19.9306640625, 21.376953125, 22.8232421875, 24.26953125, 25.7158203125, 27.162109375, 28.6083984375, 30.0546875, 31.5009765625, 32.947265625, 34.3935546875, 35.83984375, 37.2861328125, 38.732421875, 40.1787109375, 41.625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 5.0, 13.0, 14.0, 14.0, 28.0, 40.0, 46.0, 60.0, 93.0, 113.0, 184.0, 291.0, 425.0, 661.0, 602.0, 480.0, 323.0, 197.0, 143.0, 90.0, 64.0, 49.0, 30.0, 24.0, 34.0, 15.0, 11.0, 3.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.71484375, -3.61199951171875, -3.5091552734375, -3.40631103515625, -3.303466796875, -3.20062255859375, -3.0977783203125, -2.99493408203125, -2.89208984375, -2.78924560546875, -2.6864013671875, -2.58355712890625, -2.480712890625, -2.37786865234375, -2.2750244140625, -2.17218017578125, -2.0693359375, -1.96649169921875, -1.8636474609375, -1.76080322265625, -1.657958984375, -1.55511474609375, -1.4522705078125, -1.34942626953125, -1.24658203125, -1.14373779296875, -1.0408935546875, -0.93804931640625, -0.835205078125, -0.73236083984375, -0.6295166015625, -0.52667236328125, -0.423828125, -0.32098388671875, -0.2181396484375, -0.11529541015625, -0.012451171875, 0.09039306640625, 0.1932373046875, 0.29608154296875, 0.39892578125, 0.50177001953125, 0.6046142578125, 0.70745849609375, 0.810302734375, 0.91314697265625, 1.0159912109375, 1.11883544921875, 1.2216796875, 1.32452392578125, 1.4273681640625, 1.53021240234375, 1.633056640625, 1.73590087890625, 1.8387451171875, 1.94158935546875, 2.04443359375, 2.14727783203125, 2.2501220703125, 2.35296630859375, 2.455810546875, 2.55865478515625, 2.6614990234375, 2.76434326171875, 2.8671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 8.0, 23.0, 22.0, 39.0, 61.0, 88.0, 90.0, 110.0, 126.0, 107.0, 84.0, 65.0, 40.0, 42.0, 29.0, 18.0, 13.0, 6.0, 10.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.584258079528809, -10.113957405090332, -9.643655776977539, -9.173355102539062, -8.70305347442627, -8.232752799987793, -7.762451648712158, -7.292150497436523, -6.821849346160889, -6.351548194885254, -5.881247043609619, -5.410945892333984, -4.940645217895508, -4.470343589782715, -4.000042915344238, -3.5297417640686035, -3.0594406127929688, -2.589139461517334, -2.118838310241699, -1.6485373973846436, -1.1782362461090088, -0.707935094833374, -0.23763418197631836, 0.2326669692993164, 0.7029681205749512, 1.173269271850586, 1.6435703039169312, 2.1138713359832764, 2.584172487258911, 3.054473638534546, 3.5247745513916016, 3.9950757026672363, 4.4653778076171875, 4.935678958892822, 5.405980110168457, 5.876280784606934, 6.346582412719727, 6.816883087158203, 7.287184238433838, 7.757485389709473, 8.227787017822266, 8.698087692260742, 9.168389320373535, 9.638689994812012, 10.108991622924805, 10.579292297363281, 11.049592971801758, 11.51989459991455, 11.990195274353027, 12.460495948791504, 12.930797576904297, 13.401098251342773, 13.871399879455566, 14.341700553894043, 14.812002182006836, 15.282302856445312, 15.752603530883789, 16.222904205322266, 16.693204879760742, 17.16350746154785, 17.633808135986328, 18.104108810424805, 18.57440948486328, 19.04471206665039, 19.515012741088867]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 1.0, 5.0, 8.0, 4.0, 7.0, 15.0, 15.0, 13.0, 21.0, 17.0, 25.0, 41.0, 42.0, 26.0, 37.0, 43.0, 45.0, 48.0, 47.0, 46.0, 59.0, 42.0, 51.0, 45.0, 41.0, 34.0, 33.0, 36.0, 29.0, 30.0, 12.0, 10.0, 23.0, 7.0, 5.0, 4.0, 10.0, 4.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.390345573425293, -7.156287670135498, -6.922229766845703, -6.688171863555908, -6.454113960266113, -6.220056056976318, -5.985998153686523, -5.751940727233887, -5.517882347106934, -5.283824443817139, -5.049766540527344, -4.815708637237549, -4.581650733947754, -4.347592830657959, -4.113534927368164, -3.8794772624969482, -3.6454195976257324, -3.4113616943359375, -3.1773037910461426, -2.9432458877563477, -2.7091879844665527, -2.475130081176758, -2.241072416305542, -2.007014513015747, -1.7729566097259521, -1.5388987064361572, -1.3048408031463623, -1.070783019065857, -0.836725115776062, -0.6026672124862671, -0.3686094284057617, -0.1345515251159668, 0.09950590133666992, 0.33356377482414246, 0.567621648311615, 0.8016794919967651, 1.03573739528656, 1.269795298576355, 1.5038530826568604, 1.7379109859466553, 1.9719688892364502, 2.206026792526245, 2.44008469581604, 2.674142360687256, 2.908200263977051, 3.1422581672668457, 3.3763160705566406, 3.6103739738464355, 3.8444318771362305, 4.078489780426025, 4.31254768371582, 4.546605587005615, 4.78066349029541, 5.014721393585205, 5.248779296875, 5.482836723327637, 5.71689510345459, 5.950953006744385, 6.18501091003418, 6.419068813323975, 6.6531267166137695, 6.8871846199035645, 7.121242523193359, 7.355299949645996, 7.589357852935791]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 7.0, 9.0, 17.0, 13.0, 23.0, 26.0, 40.0, 89.0, 185.0, 352.0, 988.0, 3157.0, 12995.0, 67491.0, 460773.0, 423665.0, 62159.0, 11942.0, 2931.0, 941.0, 352.0, 152.0, 85.0, 56.0, 43.0, 29.0, 6.0, 7.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.19232177734375, -4.0174560546875, -3.84259033203125, -3.667724609375, -3.49285888671875, -3.3179931640625, -3.14312744140625, -2.96826171875, -2.79339599609375, -2.6185302734375, -2.44366455078125, -2.268798828125, -2.09393310546875, -1.9190673828125, -1.74420166015625, -1.5693359375, -1.39447021484375, -1.2196044921875, -1.04473876953125, -0.869873046875, -0.69500732421875, -0.5201416015625, -0.34527587890625, -0.17041015625, 0.00445556640625, 0.1793212890625, 0.35418701171875, 0.529052734375, 0.70391845703125, 0.8787841796875, 1.05364990234375, 1.228515625, 1.40338134765625, 1.5782470703125, 1.75311279296875, 1.927978515625, 2.10284423828125, 2.2777099609375, 2.45257568359375, 2.62744140625, 2.80230712890625, 2.9771728515625, 3.15203857421875, 3.326904296875, 3.50177001953125, 3.6766357421875, 3.85150146484375, 4.0263671875, 4.20123291015625, 4.3760986328125, 4.55096435546875, 4.725830078125, 4.90069580078125, 5.0755615234375, 5.25042724609375, 5.42529296875, 5.60015869140625, 5.7750244140625, 5.94989013671875, 6.124755859375, 6.29962158203125, 6.4744873046875, 6.64935302734375, 6.82421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 5.0, 7.0, 12.0, 17.0, 29.0, 33.0, 36.0, 50.0, 59.0, 69.0, 67.0, 61.0, 74.0, 69.0, 77.0, 74.0, 42.0, 52.0, 37.0, 35.0, 21.0, 22.0, 10.0, 8.0, 9.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.37982177734375, -4.1776123046875, -3.97540283203125, -3.773193359375, -3.57098388671875, -3.3687744140625, -3.16656494140625, -2.96435546875, -2.76214599609375, -2.5599365234375, -2.35772705078125, -2.155517578125, -1.95330810546875, -1.7510986328125, -1.54888916015625, -1.3466796875, -1.14447021484375, -0.9422607421875, -0.74005126953125, -0.537841796875, -0.33563232421875, -0.1334228515625, 0.06878662109375, 0.27099609375, 0.47320556640625, 0.6754150390625, 0.87762451171875, 1.079833984375, 1.28204345703125, 1.4842529296875, 1.68646240234375, 1.888671875, 2.09088134765625, 2.2930908203125, 2.49530029296875, 2.697509765625, 2.89971923828125, 3.1019287109375, 3.30413818359375, 3.50634765625, 3.70855712890625, 3.9107666015625, 4.11297607421875, 4.315185546875, 4.51739501953125, 4.7196044921875, 4.92181396484375, 5.1240234375, 5.32623291015625, 5.5284423828125, 5.73065185546875, 5.932861328125, 6.13507080078125, 6.3372802734375, 6.53948974609375, 6.74169921875, 6.94390869140625, 7.1461181640625, 7.34832763671875, 7.550537109375, 7.75274658203125, 7.9549560546875, 8.15716552734375, 8.359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 7.0, 4.0, 9.0, 12.0, 17.0, 19.0, 27.0, 33.0, 39.0, 57.0, 85.0, 128.0, 255.0, 355.0, 605.0, 1156.0, 2320.0, 5225.0, 11909.0, 30165.0, 80080.0, 224041.0, 395073.0, 185511.0, 66349.0, 25654.0, 10298.0, 4445.0, 2129.0, 1044.0, 555.0, 306.0, 211.0, 127.0, 94.0, 62.0, 40.0, 23.0, 18.0, 12.0, 9.0, 7.0, 11.0, 6.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.58984375, -2.50738525390625, -2.4249267578125, -2.34246826171875, -2.260009765625, -2.17755126953125, -2.0950927734375, -2.01263427734375, -1.93017578125, -1.84771728515625, -1.7652587890625, -1.68280029296875, -1.600341796875, -1.51788330078125, -1.4354248046875, -1.35296630859375, -1.2705078125, -1.18804931640625, -1.1055908203125, -1.02313232421875, -0.940673828125, -0.85821533203125, -0.7757568359375, -0.69329833984375, -0.61083984375, -0.52838134765625, -0.4459228515625, -0.36346435546875, -0.281005859375, -0.19854736328125, -0.1160888671875, -0.03363037109375, 0.048828125, 0.13128662109375, 0.2137451171875, 0.29620361328125, 0.378662109375, 0.46112060546875, 0.5435791015625, 0.62603759765625, 0.70849609375, 0.79095458984375, 0.8734130859375, 0.95587158203125, 1.038330078125, 1.12078857421875, 1.2032470703125, 1.28570556640625, 1.3681640625, 1.45062255859375, 1.5330810546875, 1.61553955078125, 1.697998046875, 1.78045654296875, 1.8629150390625, 1.94537353515625, 2.02783203125, 2.11029052734375, 2.1927490234375, 2.27520751953125, 2.357666015625, 2.44012451171875, 2.5225830078125, 2.60504150390625, 2.6875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 8.0, 7.0, 12.0, 17.0, 15.0, 19.0, 32.0, 31.0, 36.0, 32.0, 34.0, 37.0, 54.0, 52.0, 37.0, 41.0, 42.0, 42.0, 51.0, 42.0, 36.0, 31.0, 46.0, 25.0, 38.0, 25.0, 30.0, 29.0, 19.0, 10.0, 13.0, 16.0, 5.0, 5.0, 10.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.09991455078125, -8.8326416015625, -8.56536865234375, -8.298095703125, -8.03082275390625, -7.7635498046875, -7.49627685546875, -7.22900390625, -6.96173095703125, -6.6944580078125, -6.42718505859375, -6.159912109375, -5.89263916015625, -5.6253662109375, -5.35809326171875, -5.0908203125, -4.82354736328125, -4.5562744140625, -4.28900146484375, -4.021728515625, -3.75445556640625, -3.4871826171875, -3.21990966796875, -2.95263671875, -2.68536376953125, -2.4180908203125, -2.15081787109375, -1.883544921875, -1.61627197265625, -1.3489990234375, -1.08172607421875, -0.814453125, -0.54718017578125, -0.2799072265625, -0.01263427734375, 0.254638671875, 0.52191162109375, 0.7891845703125, 1.05645751953125, 1.32373046875, 1.59100341796875, 1.8582763671875, 2.12554931640625, 2.392822265625, 2.66009521484375, 2.9273681640625, 3.19464111328125, 3.4619140625, 3.72918701171875, 3.9964599609375, 4.26373291015625, 4.531005859375, 4.79827880859375, 5.0655517578125, 5.33282470703125, 5.60009765625, 5.86737060546875, 6.1346435546875, 6.40191650390625, 6.669189453125, 6.93646240234375, 7.2037353515625, 7.47100830078125, 7.73828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 10.0, 11.0, 20.0, 29.0, 45.0, 68.0, 93.0, 160.0, 265.0, 417.0, 702.0, 1250.0, 2263.0, 4556.0, 9536.0, 22130.0, 56731.0, 167781.0, 383536.0, 256296.0, 85720.0, 31425.0, 12818.0, 6028.0, 2907.0, 1562.0, 830.0, 496.0, 273.0, 200.0, 127.0, 90.0, 51.0, 36.0, 21.0, 20.0, 11.0, 9.0, 9.0, 3.0, 2.0, 0.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9052734375, -0.8775863647460938, -0.8498992919921875, -0.8222122192382812, -0.794525146484375, -0.7668380737304688, -0.7391510009765625, -0.7114639282226562, -0.68377685546875, -0.6560897827148438, -0.6284027099609375, -0.6007156372070312, -0.573028564453125, -0.5453414916992188, -0.5176544189453125, -0.48996734619140625, -0.4622802734375, -0.43459320068359375, -0.4069061279296875, -0.37921905517578125, -0.351531982421875, -0.32384490966796875, -0.2961578369140625, -0.26847076416015625, -0.24078369140625, -0.21309661865234375, -0.1854095458984375, -0.15772247314453125, -0.130035400390625, -0.10234832763671875, -0.0746612548828125, -0.04697418212890625, -0.019287109375, 0.00839996337890625, 0.0360870361328125, 0.06377410888671875, 0.091461181640625, 0.11914825439453125, 0.1468353271484375, 0.17452239990234375, 0.20220947265625, 0.22989654541015625, 0.2575836181640625, 0.28527069091796875, 0.312957763671875, 0.34064483642578125, 0.3683319091796875, 0.39601898193359375, 0.4237060546875, 0.45139312744140625, 0.4790802001953125, 0.5067672729492188, 0.534454345703125, 0.5621414184570312, 0.5898284912109375, 0.6175155639648438, 0.64520263671875, 0.6728897094726562, 0.7005767822265625, 0.7282638549804688, 0.755950927734375, 0.7836380004882812, 0.8113250732421875, 0.8390121459960938, 0.86669921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 0.0, 4.0, 4.0, 5.0, 3.0, 7.0, 11.0, 19.0, 26.0, 32.0, 41.0, 56.0, 62.0, 70.0, 110.0, 102.0, 90.0, 85.0, 71.0, 49.0, 30.0, 31.0, 28.0, 14.0, 17.0, 7.0, 2.0, 6.0, 9.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006198883056640625, -0.0006008297204971313, -0.0005817711353302002, -0.000562712550163269, -0.0005436539649963379, -0.0005245953798294067, -0.0005055367946624756, -0.00048647820949554443, -0.0004674196243286133, -0.00044836103916168213, -0.000429302453994751, -0.0004102438688278198, -0.00039118528366088867, -0.0003721266984939575, -0.00035306811332702637, -0.0003340095281600952, -0.00031495094299316406, -0.0002958923578262329, -0.00027683377265930176, -0.0002577751874923706, -0.00023871660232543945, -0.0002196580171585083, -0.00020059943199157715, -0.000181540846824646, -0.00016248226165771484, -0.0001434236764907837, -0.00012436509132385254, -0.00010530650615692139, -8.624792098999023e-05, -6.718933582305908e-05, -4.813075065612793e-05, -2.9072165489196777e-05, -1.0013580322265625e-05, 9.045004844665527e-06, 2.810359001159668e-05, 4.716217517852783e-05, 6.622076034545898e-05, 8.527934551239014e-05, 0.00010433793067932129, 0.00012339651584625244, 0.0001424551010131836, 0.00016151368618011475, 0.0001805722713470459, 0.00019963085651397705, 0.0002186894416809082, 0.00023774802684783936, 0.0002568066120147705, 0.00027586519718170166, 0.0002949237823486328, 0.00031398236751556396, 0.0003330409526824951, 0.00035209953784942627, 0.0003711581230163574, 0.0003902167081832886, 0.0004092752933502197, 0.0004283338785171509, 0.00044739246368408203, 0.0004664510488510132, 0.00048550963401794434, 0.0005045682191848755, 0.0005236268043518066, 0.0005426853895187378, 0.0005617439746856689, 0.0005808025598526001, 0.0005998611450195312]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 8.0, 12.0, 15.0, 15.0, 20.0, 18.0, 33.0, 62.0, 95.0, 182.0, 297.0, 564.0, 1449.0, 3790.0, 11856.0, 43934.0, 187987.0, 494666.0, 228760.0, 53286.0, 13983.0, 4433.0, 1553.0, 700.0, 309.0, 167.0, 96.0, 62.0, 32.0, 42.0, 34.0, 15.0, 19.0, 2.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-1.232421875, -1.194580078125, -1.15673828125, -1.118896484375, -1.0810546875, -1.043212890625, -1.00537109375, -0.967529296875, -0.9296875, -0.891845703125, -0.85400390625, -0.816162109375, -0.7783203125, -0.740478515625, -0.70263671875, -0.664794921875, -0.626953125, -0.589111328125, -0.55126953125, -0.513427734375, -0.4755859375, -0.437744140625, -0.39990234375, -0.362060546875, -0.32421875, -0.286376953125, -0.24853515625, -0.210693359375, -0.1728515625, -0.135009765625, -0.09716796875, -0.059326171875, -0.021484375, 0.016357421875, 0.05419921875, 0.092041015625, 0.1298828125, 0.167724609375, 0.20556640625, 0.243408203125, 0.28125, 0.319091796875, 0.35693359375, 0.394775390625, 0.4326171875, 0.470458984375, 0.50830078125, 0.546142578125, 0.583984375, 0.621826171875, 0.65966796875, 0.697509765625, 0.7353515625, 0.773193359375, 0.81103515625, 0.848876953125, 0.88671875, 0.924560546875, 0.96240234375, 1.000244140625, 1.0380859375, 1.075927734375, 1.11376953125, 1.151611328125, 1.189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 4.0, 5.0, 11.0, 5.0, 12.0, 11.0, 19.0, 32.0, 29.0, 25.0, 40.0, 39.0, 43.0, 51.0, 62.0, 61.0, 74.0, 84.0, 71.0, 51.0, 49.0, 40.0, 36.0, 22.0, 26.0, 23.0, 14.0, 7.0, 8.0, 7.0, 8.0, 8.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2454833984375, -0.2384490966796875, -0.231414794921875, -0.2243804931640625, -0.21734619140625, -0.2103118896484375, -0.203277587890625, -0.1962432861328125, -0.189208984375, -0.1821746826171875, -0.175140380859375, -0.1681060791015625, -0.16107177734375, -0.1540374755859375, -0.147003173828125, -0.1399688720703125, -0.1329345703125, -0.1259002685546875, -0.118865966796875, -0.1118316650390625, -0.10479736328125, -0.0977630615234375, -0.090728759765625, -0.0836944580078125, -0.07666015625, -0.0696258544921875, -0.062591552734375, -0.0555572509765625, -0.04852294921875, -0.0414886474609375, -0.034454345703125, -0.0274200439453125, -0.0203857421875, -0.0133514404296875, -0.006317138671875, 0.0007171630859375, 0.00775146484375, 0.0147857666015625, 0.021820068359375, 0.0288543701171875, 0.035888671875, 0.0429229736328125, 0.049957275390625, 0.0569915771484375, 0.06402587890625, 0.0710601806640625, 0.078094482421875, 0.0851287841796875, 0.0921630859375, 0.0991973876953125, 0.106231689453125, 0.1132659912109375, 0.12030029296875, 0.1273345947265625, 0.134368896484375, 0.1414031982421875, 0.1484375, 0.1554718017578125, 0.162506103515625, 0.1695404052734375, 0.17657470703125, 0.1836090087890625, 0.190643310546875, 0.1976776123046875, 0.2047119140625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 10.0, 11.0, 14.0, 26.0, 38.0, 65.0, 103.0, 124.0, 130.0, 139.0, 107.0, 76.0, 52.0, 36.0, 23.0, 25.0, 6.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.971366882324219, -4.660595893859863, -4.349824905395508, -4.039053916931152, -3.728283166885376, -3.4175121784210205, -3.106741428375244, -2.7959704399108887, -2.485199451446533, -2.1744284629821777, -1.8636575937271118, -1.552886724472046, -1.2421157360076904, -0.931344747543335, -0.620573878288269, -0.3098030090332031, 0.0009679794311523438, 0.31173890829086304, 0.6225098371505737, 0.9332807660102844, 1.2440516948699951, 1.5548226833343506, 1.8655935525894165, 2.1763644218444824, 2.487135410308838, 2.7979063987731934, 3.108677387237549, 3.419448137283325, 3.7302191257476807, 4.040989875793457, 4.3517608642578125, 4.662531852722168, 4.973302841186523, 5.284073829650879, 5.594844818115234, 5.90561580657959, 6.216386795043945, 6.527157783508301, 6.837928295135498, 7.1486992835998535, 7.459470272064209, 7.7702412605285645, 8.081011772155762, 8.391782760620117, 8.702553749084473, 9.013324737548828, 9.324095726013184, 9.634866714477539, 9.945637702941895, 10.25640869140625, 10.567179679870605, 10.877950668334961, 11.188721656799316, 11.499492645263672, 11.810263633728027, 12.121034622192383, 12.431804656982422, 12.742575645446777, 13.053346633911133, 13.364117622375488, 13.674888610839844, 13.9856595993042, 14.296430587768555, 14.607200622558594, 14.917972564697266]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 8.0, 3.0, 7.0, 13.0, 18.0, 21.0, 25.0, 38.0, 55.0, 43.0, 46.0, 58.0, 66.0, 62.0, 74.0, 57.0, 71.0, 52.0, 51.0, 53.0, 40.0, 41.0, 19.0, 21.0, 14.0, 11.0, 6.0, 10.0, 1.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71080207824707, -4.533476829528809, -4.356152057647705, -4.178826808929443, -4.00150203704834, -3.8241770267486572, -3.6468520164489746, -3.469526767730713, -3.2922019958496094, -3.1148769855499268, -2.937551975250244, -2.7602269649505615, -2.582901954650879, -2.4055769443511963, -2.2282519340515137, -2.050926685333252, -1.8736016750335693, -1.6962766647338867, -1.518951654434204, -1.3416266441345215, -1.1643016338348389, -0.9869765639305115, -0.8096514940261841, -0.6323264837265015, -0.45500147342681885, -0.27767646312713623, -0.10035142302513123, 0.07697361707687378, 0.2542986273765564, 0.431623637676239, 0.6089487075805664, 0.786273717880249, 0.9635987281799316, 1.1409237384796143, 1.3182487487792969, 1.4955737590789795, 1.672898769378662, 1.8502237796783447, 2.0275487899780273, 2.204874038696289, 2.3821988105773926, 2.559523820877075, 2.736848831176758, 2.9141738414764404, 3.091498851776123, 3.2688238620758057, 3.4461488723754883, 3.62347412109375, 3.8007991313934326, 3.9781241416931152, 4.155449390411377, 4.3327741622924805, 4.510099411010742, 4.687424182891846, 4.864749431610107, 5.042074203491211, 5.219399452209473, 5.396724700927734, 5.574049472808838, 5.7513747215271, 5.928699493408203, 6.106024742126465, 6.283349514007568, 6.46067476272583, 6.637999534606934]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 4.0, 10.0, 16.0, 19.0, 26.0, 41.0, 70.0, 128.0, 231.0, 385.0, 639.0, 1260.0, 2465.0, 4933.0, 10348.0, 22996.0, 61482.0, 232337.0, 499731.0, 136399.0, 42056.0, 17089.0, 7727.0, 3781.0, 2000.0, 1079.0, 514.0, 309.0, 178.0, 110.0, 70.0, 30.0, 30.0, 25.0, 12.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.03515625, -5.85931396484375, -5.6834716796875, -5.50762939453125, -5.331787109375, -5.15594482421875, -4.9801025390625, -4.80426025390625, -4.62841796875, -4.45257568359375, -4.2767333984375, -4.10089111328125, -3.925048828125, -3.74920654296875, -3.5733642578125, -3.39752197265625, -3.2216796875, -3.04583740234375, -2.8699951171875, -2.69415283203125, -2.518310546875, -2.34246826171875, -2.1666259765625, -1.99078369140625, -1.81494140625, -1.63909912109375, -1.4632568359375, -1.28741455078125, -1.111572265625, -0.93572998046875, -0.7598876953125, -0.58404541015625, -0.408203125, -0.23236083984375, -0.0565185546875, 0.11932373046875, 0.295166015625, 0.47100830078125, 0.6468505859375, 0.82269287109375, 0.99853515625, 1.17437744140625, 1.3502197265625, 1.52606201171875, 1.701904296875, 1.87774658203125, 2.0535888671875, 2.22943115234375, 2.4052734375, 2.58111572265625, 2.7569580078125, 2.93280029296875, 3.108642578125, 3.28448486328125, 3.4603271484375, 3.63616943359375, 3.81201171875, 3.98785400390625, 4.1636962890625, 4.33953857421875, 4.515380859375, 4.69122314453125, 4.8670654296875, 5.04290771484375, 5.21875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 15.0, 14.0, 22.0, 18.0, 36.0, 34.0, 57.0, 46.0, 49.0, 63.0, 59.0, 52.0, 68.0, 67.0, 69.0, 67.0, 36.0, 36.0, 37.0, 32.0, 25.0, 16.0, 16.0, 11.0, 8.0, 10.0, 5.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.2325439453125, -8.847900390625, -8.4632568359375, -8.07861328125, -7.6939697265625, -7.309326171875, -6.9246826171875, -6.5400390625, -6.1553955078125, -5.770751953125, -5.3861083984375, -5.00146484375, -4.6168212890625, -4.232177734375, -3.8475341796875, -3.462890625, -3.0782470703125, -2.693603515625, -2.3089599609375, -1.92431640625, -1.5396728515625, -1.155029296875, -0.7703857421875, -0.3857421875, -0.0010986328125, 0.383544921875, 0.7681884765625, 1.15283203125, 1.5374755859375, 1.922119140625, 2.3067626953125, 2.69140625, 3.0760498046875, 3.460693359375, 3.8453369140625, 4.22998046875, 4.6146240234375, 4.999267578125, 5.3839111328125, 5.7685546875, 6.1531982421875, 6.537841796875, 6.9224853515625, 7.30712890625, 7.6917724609375, 8.076416015625, 8.4610595703125, 8.845703125, 9.2303466796875, 9.614990234375, 9.9996337890625, 10.38427734375, 10.7689208984375, 11.153564453125, 11.5382080078125, 11.9228515625, 12.3074951171875, 12.692138671875, 13.0767822265625, 13.46142578125, 13.8460693359375, 14.230712890625, 14.6153564453125, 15.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 10.0, 7.0, 13.0, 7.0, 16.0, 15.0, 19.0, 21.0, 22.0, 29.0, 24.0, 25.0, 31.0, 51.0, 68.0, 155.0, 864.0, 22182.0, 975521.0, 47466.0, 1360.0, 176.0, 98.0, 49.0, 44.0, 47.0, 35.0, 22.0, 31.0, 24.0, 16.0, 22.0, 18.0, 8.0, 11.0, 8.0, 8.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.859375, -26.059814453125, -25.26025390625, -24.460693359375, -23.6611328125, -22.861572265625, -22.06201171875, -21.262451171875, -20.462890625, -19.663330078125, -18.86376953125, -18.064208984375, -17.2646484375, -16.465087890625, -15.66552734375, -14.865966796875, -14.06640625, -13.266845703125, -12.46728515625, -11.667724609375, -10.8681640625, -10.068603515625, -9.26904296875, -8.469482421875, -7.669921875, -6.870361328125, -6.07080078125, -5.271240234375, -4.4716796875, -3.672119140625, -2.87255859375, -2.072998046875, -1.2734375, -0.473876953125, 0.32568359375, 1.125244140625, 1.9248046875, 2.724365234375, 3.52392578125, 4.323486328125, 5.123046875, 5.922607421875, 6.72216796875, 7.521728515625, 8.3212890625, 9.120849609375, 9.92041015625, 10.719970703125, 11.51953125, 12.319091796875, 13.11865234375, 13.918212890625, 14.7177734375, 15.517333984375, 16.31689453125, 17.116455078125, 17.916015625, 18.715576171875, 19.51513671875, 20.314697265625, 21.1142578125, 21.913818359375, 22.71337890625, 23.512939453125, 24.3125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 6.0, 7.0, 12.0, 10.0, 12.0, 11.0, 17.0, 16.0, 21.0, 26.0, 14.0, 27.0, 30.0, 28.0, 29.0, 39.0, 34.0, 49.0, 39.0, 37.0, 44.0, 33.0, 41.0, 47.0, 44.0, 36.0, 35.0, 26.0, 26.0, 22.0, 32.0, 20.0, 27.0, 12.0, 9.0, 10.0, 12.0, 11.0, 14.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.1328125, -7.8865966796875, -7.640380859375, -7.3941650390625, -7.14794921875, -6.9017333984375, -6.655517578125, -6.4093017578125, -6.1630859375, -5.9168701171875, -5.670654296875, -5.4244384765625, -5.17822265625, -4.9320068359375, -4.685791015625, -4.4395751953125, -4.193359375, -3.9471435546875, -3.700927734375, -3.4547119140625, -3.20849609375, -2.9622802734375, -2.716064453125, -2.4698486328125, -2.2236328125, -1.9774169921875, -1.731201171875, -1.4849853515625, -1.23876953125, -0.9925537109375, -0.746337890625, -0.5001220703125, -0.25390625, -0.0076904296875, 0.238525390625, 0.4847412109375, 0.73095703125, 0.9771728515625, 1.223388671875, 1.4696044921875, 1.7158203125, 1.9620361328125, 2.208251953125, 2.4544677734375, 2.70068359375, 2.9468994140625, 3.193115234375, 3.4393310546875, 3.685546875, 3.9317626953125, 4.177978515625, 4.4241943359375, 4.67041015625, 4.9166259765625, 5.162841796875, 5.4090576171875, 5.6552734375, 5.9014892578125, 6.147705078125, 6.3939208984375, 6.64013671875, 6.8863525390625, 7.132568359375, 7.3787841796875, 7.625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 13.0, 24.0, 28.0, 29.0, 61.0, 117.0, 215.0, 418.0, 1076.0, 3160.0, 13506.0, 106128.0, 788108.0, 116060.0, 14167.0, 3367.0, 1128.0, 452.0, 192.0, 108.0, 57.0, 38.0, 25.0, 17.0, 11.0, 3.0, 9.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.143768310546875, -2.06292724609375, -1.982086181640625, -1.9012451171875, -1.820404052734375, -1.73956298828125, -1.658721923828125, -1.577880859375, -1.497039794921875, -1.41619873046875, -1.335357666015625, -1.2545166015625, -1.173675537109375, -1.09283447265625, -1.011993408203125, -0.93115234375, -0.850311279296875, -0.76947021484375, -0.688629150390625, -0.6077880859375, -0.526947021484375, -0.44610595703125, -0.365264892578125, -0.284423828125, -0.203582763671875, -0.12274169921875, -0.041900634765625, 0.0389404296875, 0.119781494140625, 0.20062255859375, 0.281463623046875, 0.3623046875, 0.443145751953125, 0.52398681640625, 0.604827880859375, 0.6856689453125, 0.766510009765625, 0.84735107421875, 0.928192138671875, 1.009033203125, 1.089874267578125, 1.17071533203125, 1.251556396484375, 1.3323974609375, 1.413238525390625, 1.49407958984375, 1.574920654296875, 1.65576171875, 1.736602783203125, 1.81744384765625, 1.898284912109375, 1.9791259765625, 2.059967041015625, 2.14080810546875, 2.221649169921875, 2.302490234375, 2.383331298828125, 2.46417236328125, 2.545013427734375, 2.6258544921875, 2.706695556640625, 2.78753662109375, 2.868377685546875, 2.94921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 8.0, 6.0, 15.0, 22.0, 28.0, 62.0, 100.0, 124.0, 187.0, 162.0, 107.0, 60.0, 57.0, 27.0, 18.0, 11.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004611015319824219, -0.0004478655755519867, -0.0004346296191215515, -0.00042139366269111633, -0.00040815770626068115, -0.00039492174983024597, -0.0003816857933998108, -0.0003684498369693756, -0.00035521388053894043, -0.00034197792410850525, -0.00032874196767807007, -0.0003155060112476349, -0.0003022700548171997, -0.0002890340983867645, -0.00027579814195632935, -0.00026256218552589417, -0.000249326229095459, -0.0002360902726650238, -0.00022285431623458862, -0.00020961835980415344, -0.00019638240337371826, -0.00018314644694328308, -0.0001699104905128479, -0.00015667453408241272, -0.00014343857765197754, -0.00013020262122154236, -0.00011696666479110718, -0.000103730708360672, -9.049475193023682e-05, -7.725879549980164e-05, -6.402283906936646e-05, -5.0786882638931274e-05, -3.7550926208496094e-05, -2.4314969778060913e-05, -1.1079013347625732e-05, 2.1569430828094482e-06, 1.539289951324463e-05, 2.862885594367981e-05, 4.186481237411499e-05, 5.510076880455017e-05, 6.833672523498535e-05, 8.157268166542053e-05, 9.480863809585571e-05, 0.0001080445945262909, 0.00012128055095672607, 0.00013451650738716125, 0.00014775246381759644, 0.00016098842024803162, 0.0001742243766784668, 0.00018746033310890198, 0.00020069628953933716, 0.00021393224596977234, 0.00022716820240020752, 0.0002404041588306427, 0.0002536401152610779, 0.00026687607169151306, 0.00028011202812194824, 0.0002933479845523834, 0.0003065839409828186, 0.0003198198974132538, 0.00033305585384368896, 0.00034629181027412415, 0.0003595277667045593, 0.0003727637231349945, 0.0003859996795654297]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 13.0, 19.0, 27.0, 40.0, 52.0, 95.0, 141.0, 190.0, 323.0, 604.0, 1094.0, 2138.0, 4440.0, 10182.0, 26103.0, 85699.0, 359817.0, 408312.0, 98805.0, 29405.0, 11074.0, 4884.0, 2296.0, 1147.0, 672.0, 360.0, 213.0, 135.0, 74.0, 47.0, 51.0, 26.0, 15.0, 9.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1485137939453125, -1.107574462890625, -1.0666351318359375, -1.02569580078125, -0.9847564697265625, -0.943817138671875, -0.9028778076171875, -0.8619384765625, -0.8209991455078125, -0.780059814453125, -0.7391204833984375, -0.69818115234375, -0.6572418212890625, -0.616302490234375, -0.5753631591796875, -0.534423828125, -0.4934844970703125, -0.452545166015625, -0.4116058349609375, -0.37066650390625, -0.3297271728515625, -0.288787841796875, -0.2478485107421875, -0.2069091796875, -0.1659698486328125, -0.125030517578125, -0.0840911865234375, -0.04315185546875, -0.0022125244140625, 0.038726806640625, 0.0796661376953125, 0.12060546875, 0.1615447998046875, 0.202484130859375, 0.2434234619140625, 0.28436279296875, 0.3253021240234375, 0.366241455078125, 0.4071807861328125, 0.4481201171875, 0.4890594482421875, 0.529998779296875, 0.5709381103515625, 0.61187744140625, 0.6528167724609375, 0.693756103515625, 0.7346954345703125, 0.775634765625, 0.8165740966796875, 0.857513427734375, 0.8984527587890625, 0.93939208984375, 0.9803314208984375, 1.021270751953125, 1.0622100830078125, 1.1031494140625, 1.1440887451171875, 1.185028076171875, 1.2259674072265625, 1.26690673828125, 1.3078460693359375, 1.348785400390625, 1.3897247314453125, 1.4306640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 15.0, 14.0, 12.0, 25.0, 30.0, 34.0, 48.0, 58.0, 72.0, 84.0, 81.0, 92.0, 84.0, 67.0, 49.0, 36.0, 37.0, 23.0, 13.0, 23.0, 12.0, 12.0, 9.0, 8.0, 4.0, 6.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7584304809570312, -0.7365875244140625, -0.7147445678710938, -0.692901611328125, -0.6710586547851562, -0.6492156982421875, -0.6273727416992188, -0.60552978515625, -0.5836868286132812, -0.5618438720703125, -0.5400009155273438, -0.518157958984375, -0.49631500244140625, -0.4744720458984375, -0.45262908935546875, -0.4307861328125, -0.40894317626953125, -0.3871002197265625, -0.36525726318359375, -0.343414306640625, -0.32157135009765625, -0.2997283935546875, -0.27788543701171875, -0.25604248046875, -0.23419952392578125, -0.2123565673828125, -0.19051361083984375, -0.168670654296875, -0.14682769775390625, -0.1249847412109375, -0.10314178466796875, -0.081298828125, -0.05945587158203125, -0.0376129150390625, -0.01576995849609375, 0.006072998046875, 0.02791595458984375, 0.0497589111328125, 0.07160186767578125, 0.09344482421875, 0.11528778076171875, 0.1371307373046875, 0.15897369384765625, 0.180816650390625, 0.20265960693359375, 0.2245025634765625, 0.24634552001953125, 0.2681884765625, 0.29003143310546875, 0.3118743896484375, 0.33371734619140625, 0.355560302734375, 0.37740325927734375, 0.3992462158203125, 0.42108917236328125, 0.44293212890625, 0.46477508544921875, 0.4866180419921875, 0.5084609985351562, 0.530303955078125, 0.5521469116210938, 0.5739898681640625, 0.5958328247070312, 0.61767578125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 21.0, 56.0, 127.0, 323.0, 284.0, 127.0, 45.0, 16.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.40650177001953, -75.82705688476562, -74.24761199951172, -72.66816711425781, -71.0887222290039, -69.50927734375, -67.9298324584961, -66.35038757324219, -64.77095031738281, -63.191505432128906, -61.612060546875, -60.032615661621094, -58.45317077636719, -56.87372970581055, -55.29428482055664, -53.714839935302734, -52.13539123535156, -50.555946350097656, -48.97650146484375, -47.397056579589844, -45.81761169433594, -44.2381706237793, -42.65872573852539, -41.079280853271484, -39.49983596801758, -37.92039108276367, -36.340946197509766, -34.76150131225586, -33.18206024169922, -31.60261344909668, -30.023170471191406, -28.4437255859375, -26.864280700683594, -25.284835815429688, -23.70539093017578, -22.125947952270508, -20.5465030670166, -18.967058181762695, -17.387615203857422, -15.808170318603516, -14.22872543334961, -12.649280548095703, -11.069836616516113, -9.490392684936523, -7.910947799682617, -6.331503391265869, -4.752058982849121, -3.1726150512695312, -1.593170166015625, -0.013725757598876953, 1.565718650817871, 3.145163059234619, 4.724607467651367, 6.304051876068115, 7.883496284484863, 9.462940216064453, 11.04238510131836, 12.621829986572266, 14.201273918151855, 15.780717849731445, 17.36016273498535, 18.939607620239258, 20.51905059814453, 22.098495483398438, 23.677940368652344]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 8.0, 8.0, 11.0, 14.0, 24.0, 25.0, 21.0, 30.0, 36.0, 33.0, 32.0, 40.0, 40.0, 63.0, 36.0, 46.0, 43.0, 53.0, 48.0, 37.0, 40.0, 38.0, 34.0, 33.0, 27.0, 21.0, 22.0, 15.0, 20.0, 16.0, 16.0, 9.0, 9.0, 11.0, 4.0, 8.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.492140769958496, -12.017292976379395, -11.542445182800293, -11.067597389221191, -10.592748641967773, -10.117900848388672, -9.64305305480957, -9.168205261230469, -8.693357467651367, -8.218509674072266, -7.743661880493164, -7.268813610076904, -6.793965816497803, -6.319118022918701, -5.844269752502441, -5.36942195892334, -4.894574165344238, -4.419726371765137, -3.944878339767456, -3.4700303077697754, -2.995182514190674, -2.5203347206115723, -2.0454866886138916, -1.570638656616211, -1.0957908630371094, -0.6209429502487183, -0.14609503746032715, 0.32875287532806396, 0.8036007881164551, 1.2784485816955566, 1.7532966136932373, 2.228144645690918, 2.702991485595703, 3.1778392791748047, 3.6526873111724854, 4.127535343170166, 4.602383136749268, 5.077230930328369, 5.552079200744629, 6.0269269943237305, 6.501774787902832, 6.976622581481934, 7.451470375061035, 7.926318645477295, 8.401166915893555, 8.876014709472656, 9.350862503051758, 9.82571029663086, 10.300558090209961, 10.775405883789062, 11.250253677368164, 11.725101470947266, 12.199949264526367, 12.674797058105469, 13.149645805358887, 13.624493598937988, 14.09934139251709, 14.574189186096191, 15.049036979675293, 15.523884773254395, 15.998733520507812, 16.473581314086914, 16.948429107666016, 17.423276901245117, 17.89812469482422]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 16.0, 20.0, 36.0, 42.0, 72.0, 123.0, 203.0, 289.0, 505.0, 918.0, 1544.0, 3225.0, 7418.0, 20535.0, 79699.0, 509986.0, 2501218.0, 903084.0, 120599.0, 27382.0, 9045.0, 3914.0, 1892.0, 972.0, 549.0, 315.0, 218.0, 128.0, 106.0, 65.0, 37.0, 23.0, 22.0, 22.0, 9.0, 3.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.89453125, -7.62811279296875, -7.3616943359375, -7.09527587890625, -6.828857421875, -6.56243896484375, -6.2960205078125, -6.02960205078125, -5.76318359375, -5.49676513671875, -5.2303466796875, -4.96392822265625, -4.697509765625, -4.43109130859375, -4.1646728515625, -3.89825439453125, -3.6318359375, -3.36541748046875, -3.0989990234375, -2.83258056640625, -2.566162109375, -2.29974365234375, -2.0333251953125, -1.76690673828125, -1.50048828125, -1.23406982421875, -0.9676513671875, -0.70123291015625, -0.434814453125, -0.16839599609375, 0.0980224609375, 0.36444091796875, 0.630859375, 0.89727783203125, 1.1636962890625, 1.43011474609375, 1.696533203125, 1.96295166015625, 2.2293701171875, 2.49578857421875, 2.76220703125, 3.02862548828125, 3.2950439453125, 3.56146240234375, 3.827880859375, 4.09429931640625, 4.3607177734375, 4.62713623046875, 4.8935546875, 5.15997314453125, 5.4263916015625, 5.69281005859375, 5.959228515625, 6.22564697265625, 6.4920654296875, 6.75848388671875, 7.02490234375, 7.29132080078125, 7.5577392578125, 7.82415771484375, 8.090576171875, 8.35699462890625, 8.6234130859375, 8.88983154296875, 9.15625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 3.0, 6.0, 5.0, 6.0, 7.0, 12.0, 14.0, 22.0, 22.0, 26.0, 32.0, 42.0, 43.0, 49.0, 40.0, 59.0, 57.0, 58.0, 58.0, 54.0, 66.0, 55.0, 40.0, 34.0, 42.0, 26.0, 18.0, 23.0, 11.0, 13.0, 20.0, 9.0, 9.0, 4.0, 7.0, 2.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.70294189453125, -6.4996337890625, -6.29632568359375, -6.093017578125, -5.88970947265625, -5.6864013671875, -5.48309326171875, -5.27978515625, -5.07647705078125, -4.8731689453125, -4.66986083984375, -4.466552734375, -4.26324462890625, -4.0599365234375, -3.85662841796875, -3.6533203125, -3.45001220703125, -3.2467041015625, -3.04339599609375, -2.840087890625, -2.63677978515625, -2.4334716796875, -2.23016357421875, -2.02685546875, -1.82354736328125, -1.6202392578125, -1.41693115234375, -1.213623046875, -1.01031494140625, -0.8070068359375, -0.60369873046875, -0.400390625, -0.19708251953125, 0.0062255859375, 0.20953369140625, 0.412841796875, 0.61614990234375, 0.8194580078125, 1.02276611328125, 1.22607421875, 1.42938232421875, 1.6326904296875, 1.83599853515625, 2.039306640625, 2.24261474609375, 2.4459228515625, 2.64923095703125, 2.8525390625, 3.05584716796875, 3.2591552734375, 3.46246337890625, 3.665771484375, 3.86907958984375, 4.0723876953125, 4.27569580078125, 4.47900390625, 4.68231201171875, 4.8856201171875, 5.08892822265625, 5.292236328125, 5.49554443359375, 5.6988525390625, 5.90216064453125, 6.10546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 13.0, 12.0, 32.0, 40.0, 61.0, 98.0, 158.0, 337.0, 1360.0, 12796.0, 2614336.0, 1552172.0, 10860.0, 1222.0, 303.0, 171.0, 95.0, 68.0, 44.0, 28.0, 21.0, 14.0, 8.0, 5.0, 3.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.3125, -16.5244140625, -15.736328125, -14.9482421875, -14.16015625, -13.3720703125, -12.583984375, -11.7958984375, -11.0078125, -10.2197265625, -9.431640625, -8.6435546875, -7.85546875, -7.0673828125, -6.279296875, -5.4912109375, -4.703125, -3.9150390625, -3.126953125, -2.3388671875, -1.55078125, -0.7626953125, 0.025390625, 0.8134765625, 1.6015625, 2.3896484375, 3.177734375, 3.9658203125, 4.75390625, 5.5419921875, 6.330078125, 7.1181640625, 7.90625, 8.6943359375, 9.482421875, 10.2705078125, 11.05859375, 11.8466796875, 12.634765625, 13.4228515625, 14.2109375, 14.9990234375, 15.787109375, 16.5751953125, 17.36328125, 18.1513671875, 18.939453125, 19.7275390625, 20.515625, 21.3037109375, 22.091796875, 22.8798828125, 23.66796875, 24.4560546875, 25.244140625, 26.0322265625, 26.8203125, 27.6083984375, 28.396484375, 29.1845703125, 29.97265625, 30.7607421875, 31.548828125, 32.3369140625, 33.125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 20.0, 21.0, 37.0, 64.0, 88.0, 135.0, 251.0, 449.0, 771.0, 935.0, 575.0, 279.0, 150.0, 98.0, 62.0, 41.0, 25.0, 16.0, 14.0, 11.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5, -4.38525390625, -4.2705078125, -4.15576171875, -4.041015625, -3.92626953125, -3.8115234375, -3.69677734375, -3.58203125, -3.46728515625, -3.3525390625, -3.23779296875, -3.123046875, -3.00830078125, -2.8935546875, -2.77880859375, -2.6640625, -2.54931640625, -2.4345703125, -2.31982421875, -2.205078125, -2.09033203125, -1.9755859375, -1.86083984375, -1.74609375, -1.63134765625, -1.5166015625, -1.40185546875, -1.287109375, -1.17236328125, -1.0576171875, -0.94287109375, -0.828125, -0.71337890625, -0.5986328125, -0.48388671875, -0.369140625, -0.25439453125, -0.1396484375, -0.02490234375, 0.08984375, 0.20458984375, 0.3193359375, 0.43408203125, 0.548828125, 0.66357421875, 0.7783203125, 0.89306640625, 1.0078125, 1.12255859375, 1.2373046875, 1.35205078125, 1.466796875, 1.58154296875, 1.6962890625, 1.81103515625, 1.92578125, 2.04052734375, 2.1552734375, 2.27001953125, 2.384765625, 2.49951171875, 2.6142578125, 2.72900390625, 2.84375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 8.0, 3.0, 6.0, 14.0, 21.0, 37.0, 42.0, 59.0, 86.0, 102.0, 143.0, 115.0, 101.0, 92.0, 57.0, 31.0, 26.0, 26.0, 15.0, 6.0, 5.0, 5.0, 1.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.095888137817383, -7.672084331512451, -7.2482805252075195, -6.824477195739746, -6.4006733894348145, -5.976869583129883, -5.553066253662109, -5.129262447357178, -4.705458641052246, -4.2816548347473145, -3.857851266860962, -3.4340476989746094, -3.0102438926696777, -2.586440086364746, -2.1626365184783936, -1.738832950592041, -1.3150291442871094, -0.8912254571914673, -0.4674217700958252, -0.043618083000183105, 0.380185604095459, 0.8039894104003906, 1.2277929782867432, 1.6515965461730957, 2.0754003524780273, 2.499204158782959, 2.9230077266693115, 3.346811294555664, 3.7706151008605957, 4.194418907165527, 4.618222236633301, 5.042026042938232, 5.465829849243164, 5.889633655548096, 6.313437461853027, 6.737240791320801, 7.161044597625732, 7.584848403930664, 8.008651733398438, 8.432455062866211, 8.8562593460083, 9.280062675476074, 9.703866958618164, 10.127670288085938, 10.551473617553711, 10.9752779006958, 11.399081230163574, 11.822885513305664, 12.246688842773438, 12.670492172241211, 13.0942964553833, 13.518099784851074, 13.941904067993164, 14.365707397460938, 14.789510726928711, 15.213314056396484, 15.637118339538574, 16.060922622680664, 16.484725952148438, 16.90852928161621, 17.332332611083984, 17.75613784790039, 18.179941177368164, 18.603744506835938, 19.02754783630371]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 17.0, 10.0, 22.0, 19.0, 34.0, 35.0, 41.0, 37.0, 31.0, 56.0, 70.0, 54.0, 62.0, 70.0, 65.0, 57.0, 52.0, 48.0, 34.0, 41.0, 28.0, 24.0, 20.0, 11.0, 17.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.007919311523438, -7.742435455322266, -7.476951599121094, -7.211467266082764, -6.945983409881592, -6.68049955368042, -6.41501522064209, -6.149531364440918, -5.884047508239746, -5.618563652038574, -5.353079795837402, -5.087595462799072, -4.8221116065979, -4.5566277503967285, -4.291143417358398, -4.025659561157227, -3.7601757049560547, -3.494691848754883, -3.229207754135132, -2.963723659515381, -2.698239803314209, -2.432755947113037, -2.167271852493286, -1.9017878770828247, -1.6363039016723633, -1.3708199262619019, -1.1053359508514404, -0.839851975440979, -0.5743680000305176, -0.30888402462005615, -0.04340004920959473, 0.2220839262008667, 0.4875679016113281, 0.7530518770217896, 1.018535852432251, 1.2840198278427124, 1.5495038032531738, 1.8149877786636353, 2.0804717540740967, 2.3459558486938477, 2.6114397048950195, 2.8769235610961914, 3.1424076557159424, 3.4078917503356934, 3.6733756065368652, 3.938859462738037, 4.204343795776367, 4.469827651977539, 4.735311508178711, 5.000795364379883, 5.266279220581055, 5.531763553619385, 5.797247409820557, 6.0627312660217285, 6.328215599060059, 6.5936994552612305, 6.859183311462402, 7.124667167663574, 7.390151023864746, 7.655635356903076, 7.921119213104248, 8.186603546142578, 8.45208740234375, 8.717571258544922, 8.983055114746094]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 15.0, 12.0, 22.0, 35.0, 39.0, 48.0, 98.0, 179.0, 291.0, 570.0, 1154.0, 2525.0, 5871.0, 14737.0, 39874.0, 119622.0, 390008.0, 324123.0, 95431.0, 32272.0, 12361.0, 4962.0, 2137.0, 982.0, 519.0, 257.0, 156.0, 69.0, 56.0, 35.0, 27.0, 20.0, 11.0, 9.0, 6.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.164337158203125, -2.09429931640625, -2.024261474609375, -1.9542236328125, -1.884185791015625, -1.81414794921875, -1.744110107421875, -1.674072265625, -1.604034423828125, -1.53399658203125, -1.463958740234375, -1.3939208984375, -1.323883056640625, -1.25384521484375, -1.183807373046875, -1.11376953125, -1.043731689453125, -0.97369384765625, -0.903656005859375, -0.8336181640625, -0.763580322265625, -0.69354248046875, -0.623504638671875, -0.553466796875, -0.483428955078125, -0.41339111328125, -0.343353271484375, -0.2733154296875, -0.203277587890625, -0.13323974609375, -0.063201904296875, 0.0068359375, 0.076873779296875, 0.14691162109375, 0.216949462890625, 0.2869873046875, 0.357025146484375, 0.42706298828125, 0.497100830078125, 0.567138671875, 0.637176513671875, 0.70721435546875, 0.777252197265625, 0.8472900390625, 0.917327880859375, 0.98736572265625, 1.057403564453125, 1.12744140625, 1.197479248046875, 1.26751708984375, 1.337554931640625, 1.4075927734375, 1.477630615234375, 1.54766845703125, 1.617706298828125, 1.687744140625, 1.757781982421875, 1.82781982421875, 1.897857666015625, 1.9678955078125, 2.037933349609375, 2.10797119140625, 2.178009033203125, 2.248046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 12.0, 21.0, 17.0, 34.0, 39.0, 45.0, 47.0, 59.0, 69.0, 66.0, 68.0, 80.0, 77.0, 68.0, 59.0, 41.0, 39.0, 38.0, 28.0, 17.0, 14.0, 12.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1796875, -4.988525390625, -4.79736328125, -4.606201171875, -4.4150390625, -4.223876953125, -4.03271484375, -3.841552734375, -3.650390625, -3.459228515625, -3.26806640625, -3.076904296875, -2.8857421875, -2.694580078125, -2.50341796875, -2.312255859375, -2.12109375, -1.929931640625, -1.73876953125, -1.547607421875, -1.3564453125, -1.165283203125, -0.97412109375, -0.782958984375, -0.591796875, -0.400634765625, -0.20947265625, -0.018310546875, 0.1728515625, 0.364013671875, 0.55517578125, 0.746337890625, 0.9375, 1.128662109375, 1.31982421875, 1.510986328125, 1.7021484375, 1.893310546875, 2.08447265625, 2.275634765625, 2.466796875, 2.657958984375, 2.84912109375, 3.040283203125, 3.2314453125, 3.422607421875, 3.61376953125, 3.804931640625, 3.99609375, 4.187255859375, 4.37841796875, 4.569580078125, 4.7607421875, 4.951904296875, 5.14306640625, 5.334228515625, 5.525390625, 5.716552734375, 5.90771484375, 6.098876953125, 6.2900390625, 6.481201171875, 6.67236328125, 6.863525390625, 7.0546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 8.0, 11.0, 23.0, 24.0, 25.0, 48.0, 71.0, 84.0, 187.0, 270.0, 505.0, 870.0, 1702.0, 3428.0, 7916.0, 19458.0, 52118.0, 156363.0, 396942.0, 268557.0, 86461.0, 30743.0, 12315.0, 5312.0, 2339.0, 1173.0, 619.0, 339.0, 242.0, 132.0, 85.0, 63.0, 36.0, 22.0, 27.0, 10.0, 8.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.7610931396484375, -1.701873779296875, -1.6426544189453125, -1.58343505859375, -1.5242156982421875, -1.464996337890625, -1.4057769775390625, -1.3465576171875, -1.2873382568359375, -1.228118896484375, -1.1688995361328125, -1.10968017578125, -1.0504608154296875, -0.991241455078125, -0.9320220947265625, -0.872802734375, -0.8135833740234375, -0.754364013671875, -0.6951446533203125, -0.63592529296875, -0.5767059326171875, -0.517486572265625, -0.4582672119140625, -0.3990478515625, -0.3398284912109375, -0.280609130859375, -0.2213897705078125, -0.16217041015625, -0.1029510498046875, -0.043731689453125, 0.0154876708984375, 0.07470703125, 0.1339263916015625, 0.193145751953125, 0.2523651123046875, 0.31158447265625, 0.3708038330078125, 0.430023193359375, 0.4892425537109375, 0.5484619140625, 0.6076812744140625, 0.666900634765625, 0.7261199951171875, 0.78533935546875, 0.8445587158203125, 0.903778076171875, 0.9629974365234375, 1.022216796875, 1.0814361572265625, 1.140655517578125, 1.1998748779296875, 1.25909423828125, 1.3183135986328125, 1.377532958984375, 1.4367523193359375, 1.4959716796875, 1.5551910400390625, 1.614410400390625, 1.6736297607421875, 1.73284912109375, 1.7920684814453125, 1.851287841796875, 1.9105072021484375, 1.9697265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 5.0, 11.0, 9.0, 8.0, 14.0, 14.0, 31.0, 24.0, 30.0, 33.0, 36.0, 30.0, 41.0, 39.0, 43.0, 42.0, 34.0, 44.0, 56.0, 52.0, 52.0, 46.0, 35.0, 27.0, 34.0, 33.0, 23.0, 27.0, 19.0, 13.0, 19.0, 7.0, 6.0, 9.0, 5.0, 5.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-8.3984375, -8.14532470703125, -7.8922119140625, -7.63909912109375, -7.385986328125, -7.13287353515625, -6.8797607421875, -6.62664794921875, -6.37353515625, -6.12042236328125, -5.8673095703125, -5.61419677734375, -5.361083984375, -5.10797119140625, -4.8548583984375, -4.60174560546875, -4.3486328125, -4.09552001953125, -3.8424072265625, -3.58929443359375, -3.336181640625, -3.08306884765625, -2.8299560546875, -2.57684326171875, -2.32373046875, -2.07061767578125, -1.8175048828125, -1.56439208984375, -1.311279296875, -1.05816650390625, -0.8050537109375, -0.55194091796875, -0.298828125, -0.04571533203125, 0.2073974609375, 0.46051025390625, 0.713623046875, 0.96673583984375, 1.2198486328125, 1.47296142578125, 1.72607421875, 1.97918701171875, 2.2322998046875, 2.48541259765625, 2.738525390625, 2.99163818359375, 3.2447509765625, 3.49786376953125, 3.7509765625, 4.00408935546875, 4.2572021484375, 4.51031494140625, 4.763427734375, 5.01654052734375, 5.2696533203125, 5.52276611328125, 5.77587890625, 6.02899169921875, 6.2821044921875, 6.53521728515625, 6.788330078125, 7.04144287109375, 7.2945556640625, 7.54766845703125, 7.80078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 5.0, 7.0, 8.0, 11.0, 26.0, 36.0, 82.0, 125.0, 238.0, 529.0, 1209.0, 3251.0, 10640.0, 46930.0, 315730.0, 545301.0, 97980.0, 18297.0, 5008.0, 1716.0, 745.0, 312.0, 163.0, 80.0, 49.0, 22.0, 17.0, 13.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1403656005859375, -1.104949951171875, -1.0695343017578125, -1.03411865234375, -0.9987030029296875, -0.963287353515625, -0.9278717041015625, -0.8924560546875, -0.8570404052734375, -0.821624755859375, -0.7862091064453125, -0.75079345703125, -0.7153778076171875, -0.679962158203125, -0.6445465087890625, -0.609130859375, -0.5737152099609375, -0.538299560546875, -0.5028839111328125, -0.46746826171875, -0.4320526123046875, -0.396636962890625, -0.3612213134765625, -0.3258056640625, -0.2903900146484375, -0.254974365234375, -0.2195587158203125, -0.18414306640625, -0.1487274169921875, -0.113311767578125, -0.0778961181640625, -0.04248046875, -0.0070648193359375, 0.028350830078125, 0.0637664794921875, 0.09918212890625, 0.1345977783203125, 0.170013427734375, 0.2054290771484375, 0.2408447265625, 0.2762603759765625, 0.311676025390625, 0.3470916748046875, 0.38250732421875, 0.4179229736328125, 0.453338623046875, 0.4887542724609375, 0.524169921875, 0.5595855712890625, 0.595001220703125, 0.6304168701171875, 0.66583251953125, 0.7012481689453125, 0.736663818359375, 0.7720794677734375, 0.8074951171875, 0.8429107666015625, 0.878326416015625, 0.9137420654296875, 0.94915771484375, 0.9845733642578125, 1.019989013671875, 1.0554046630859375, 1.0908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 7.0, 8.0, 13.0, 15.0, 20.0, 27.0, 30.0, 35.0, 41.0, 59.0, 63.0, 69.0, 66.0, 80.0, 59.0, 66.0, 48.0, 63.0, 46.0, 24.0, 33.0, 22.0, 17.0, 10.0, 9.0, 9.0, 7.0, 10.0, 5.0, 3.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003364086151123047, -0.0003260299563407898, -0.0003156512975692749, -0.00030527263879776, -0.0002948939800262451, -0.0002845153212547302, -0.00027413666248321533, -0.00026375800371170044, -0.00025337934494018555, -0.00024300068616867065, -0.00023262202739715576, -0.00022224336862564087, -0.00021186470985412598, -0.00020148605108261108, -0.0001911073923110962, -0.0001807287335395813, -0.0001703500747680664, -0.00015997141599655151, -0.00014959275722503662, -0.00013921409845352173, -0.00012883543968200684, -0.00011845678091049194, -0.00010807812213897705, -9.769946336746216e-05, -8.732080459594727e-05, -7.694214582443237e-05, -6.656348705291748e-05, -5.618482828140259e-05, -4.5806169509887695e-05, -3.54275107383728e-05, -2.504885196685791e-05, -1.4670193195343018e-05, -4.291534423828125e-06, 6.087124347686768e-06, 1.646578311920166e-05, 2.6844441890716553e-05, 3.7223100662231445e-05, 4.760175943374634e-05, 5.798041820526123e-05, 6.835907697677612e-05, 7.873773574829102e-05, 8.911639451980591e-05, 9.94950532913208e-05, 0.0001098737120628357, 0.00012025237083435059, 0.00013063102960586548, 0.00014100968837738037, 0.00015138834714889526, 0.00016176700592041016, 0.00017214566469192505, 0.00018252432346343994, 0.00019290298223495483, 0.00020328164100646973, 0.00021366029977798462, 0.0002240389585494995, 0.0002344176173210144, 0.0002447962760925293, 0.0002551749348640442, 0.0002655535936355591, 0.000275932252407074, 0.00028631091117858887, 0.00029668956995010376, 0.00030706822872161865, 0.00031744688749313354, 0.00032782554626464844]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 13.0, 14.0, 16.0, 23.0, 33.0, 57.0, 117.0, 224.0, 501.0, 1394.0, 4340.0, 16387.0, 87127.0, 485567.0, 372936.0, 61461.0, 12617.0, 3564.0, 1184.0, 463.0, 214.0, 123.0, 66.0, 23.0, 18.0, 22.0, 12.0, 6.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2431640625, -1.20947265625, -1.17578125, -1.14208984375, -1.1083984375, -1.07470703125, -1.041015625, -1.00732421875, -0.9736328125, -0.93994140625, -0.90625, -0.87255859375, -0.8388671875, -0.80517578125, -0.771484375, -0.73779296875, -0.7041015625, -0.67041015625, -0.63671875, -0.60302734375, -0.5693359375, -0.53564453125, -0.501953125, -0.46826171875, -0.4345703125, -0.40087890625, -0.3671875, -0.33349609375, -0.2998046875, -0.26611328125, -0.232421875, -0.19873046875, -0.1650390625, -0.13134765625, -0.09765625, -0.06396484375, -0.0302734375, 0.00341796875, 0.037109375, 0.07080078125, 0.1044921875, 0.13818359375, 0.171875, 0.20556640625, 0.2392578125, 0.27294921875, 0.306640625, 0.34033203125, 0.3740234375, 0.40771484375, 0.44140625, 0.47509765625, 0.5087890625, 0.54248046875, 0.576171875, 0.60986328125, 0.6435546875, 0.67724609375, 0.7109375, 0.74462890625, 0.7783203125, 0.81201171875, 0.845703125, 0.87939453125, 0.9130859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 4.0, 10.0, 17.0, 15.0, 13.0, 20.0, 31.0, 53.0, 52.0, 55.0, 70.0, 61.0, 64.0, 53.0, 70.0, 69.0, 65.0, 50.0, 32.0, 32.0, 28.0, 20.0, 18.0, 18.0, 12.0, 14.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1510009765625, -0.14468955993652344, -0.13837814331054688, -0.1320667266845703, -0.12575531005859375, -0.11944389343261719, -0.11313247680664062, -0.10682106018066406, -0.1005096435546875, -0.09419822692871094, -0.08788681030273438, -0.08157539367675781, -0.07526397705078125, -0.06895256042480469, -0.06264114379882812, -0.05632972717285156, -0.050018310546875, -0.04370689392089844, -0.037395477294921875, -0.031084060668945312, -0.02477264404296875, -0.018461227416992188, -0.012149810791015625, -0.0058383941650390625, 0.0004730224609375, 0.0067844390869140625, 0.013095855712890625, 0.019407272338867188, 0.02571868896484375, 0.03203010559082031, 0.038341522216796875, 0.04465293884277344, 0.05096435546875, 0.05727577209472656, 0.06358718872070312, 0.06989860534667969, 0.07621002197265625, 0.08252143859863281, 0.08883285522460938, 0.09514427185058594, 0.1014556884765625, 0.10776710510253906, 0.11407852172851562, 0.12038993835449219, 0.12670135498046875, 0.1330127716064453, 0.13932418823242188, 0.14563560485839844, 0.151947021484375, 0.15825843811035156, 0.16456985473632812, 0.1708812713623047, 0.17719268798828125, 0.1835041046142578, 0.18981552124023438, 0.19612693786621094, 0.2024383544921875, 0.20874977111816406, 0.21506118774414062, 0.2213726043701172, 0.22768402099609375, 0.2339954376220703, 0.24030685424804688, 0.24661827087402344, 0.2529296875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 8.0, 17.0, 12.0, 36.0, 46.0, 86.0, 123.0, 156.0, 174.0, 134.0, 81.0, 46.0, 37.0, 19.0, 9.0, 8.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.988353252410889, -4.659221172332764, -4.330089092254639, -4.000957012176514, -3.6718246936798096, -3.3426926136016846, -3.0135602951049805, -2.6844282150268555, -2.3552961349487305, -2.0261640548706055, -1.697031855583191, -1.3678996562957764, -1.0387675762176514, -0.7096354961395264, -0.3805032968521118, -0.051371097564697266, 0.27776098251342773, 0.6068931221961975, 0.9360252618789673, 1.2651574611663818, 1.5942895412445068, 1.9234216213226318, 2.252553939819336, 2.581686019897461, 2.910818099975586, 3.239950180053711, 3.569082260131836, 3.89821457862854, 4.227346420288086, 4.556478500366211, 4.885611057281494, 5.214743137359619, 5.543874740600586, 5.873006820678711, 6.202138900756836, 6.531270980834961, 6.860403060913086, 7.189535140991211, 7.518667697906494, 7.847799777984619, 8.176931381225586, 8.506063461303711, 8.835195541381836, 9.164327621459961, 9.493459701538086, 9.822591781616211, 10.151723861694336, 10.480855941772461, 10.809988975524902, 11.139121055603027, 11.468253135681152, 11.797385215759277, 12.126517295837402, 12.455649375915527, 12.784781455993652, 13.113914489746094, 13.443046569824219, 13.772178649902344, 14.101310729980469, 14.430442810058594, 14.759574890136719, 15.088706970214844, 15.417839050292969, 15.746971130371094, 16.07610321044922]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 5.0, 5.0, 11.0, 22.0, 14.0, 30.0, 35.0, 47.0, 34.0, 52.0, 73.0, 72.0, 68.0, 78.0, 79.0, 69.0, 65.0, 51.0, 34.0, 33.0, 31.0, 20.0, 18.0, 18.0, 11.0, 9.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.821997165679932, -4.639649391174316, -4.457301616668701, -4.274953842163086, -4.092606067657471, -3.9102582931518555, -3.727910280227661, -3.545562505722046, -3.3632147312164307, -3.1808669567108154, -2.9985191822052, -2.816171169281006, -2.6338233947753906, -2.4514756202697754, -2.26912784576416, -2.086780071258545, -1.9044322967529297, -1.7220845222473145, -1.5397367477416992, -1.3573888540267944, -1.1750410795211792, -0.992693305015564, -0.8103454113006592, -0.627997636795044, -0.4456498622894287, -0.2633020579814911, -0.08095425367355347, 0.10139358043670654, 0.2837413549423218, 0.466089129447937, 0.6484370231628418, 0.830784797668457, 1.013132095336914, 1.1954798698425293, 1.3778276443481445, 1.5601755380630493, 1.7425233125686646, 1.9248710870742798, 2.1072189807891846, 2.2895667552948, 2.471914529800415, 2.6542623043060303, 2.8366100788116455, 3.01895809173584, 3.201305866241455, 3.3836536407470703, 3.5660014152526855, 3.748349189758301, 3.930696964263916, 4.113044738769531, 4.2953925132751465, 4.477740287780762, 4.660088062286377, 4.842435836791992, 5.024784088134766, 5.207131385803223, 5.389479637145996, 5.571827411651611, 5.754175186157227, 5.936522960662842, 6.118870735168457, 6.301218509674072, 6.4835662841796875, 6.665914535522461, 6.848261833190918]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 6.0, 5.0, 5.0, 12.0, 10.0, 10.0, 14.0, 38.0, 37.0, 70.0, 189.0, 625.0, 2711.0, 18816.0, 242512.0, 723554.0, 52028.0, 6149.0, 1173.0, 298.0, 105.0, 57.0, 39.0, 22.0, 16.0, 12.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.3125, -10.98193359375, -10.6513671875, -10.32080078125, -9.990234375, -9.65966796875, -9.3291015625, -8.99853515625, -8.66796875, -8.33740234375, -8.0068359375, -7.67626953125, -7.345703125, -7.01513671875, -6.6845703125, -6.35400390625, -6.0234375, -5.69287109375, -5.3623046875, -5.03173828125, -4.701171875, -4.37060546875, -4.0400390625, -3.70947265625, -3.37890625, -3.04833984375, -2.7177734375, -2.38720703125, -2.056640625, -1.72607421875, -1.3955078125, -1.06494140625, -0.734375, -0.40380859375, -0.0732421875, 0.25732421875, 0.587890625, 0.91845703125, 1.2490234375, 1.57958984375, 1.91015625, 2.24072265625, 2.5712890625, 2.90185546875, 3.232421875, 3.56298828125, 3.8935546875, 4.22412109375, 4.5546875, 4.88525390625, 5.2158203125, 5.54638671875, 5.876953125, 6.20751953125, 6.5380859375, 6.86865234375, 7.19921875, 7.52978515625, 7.8603515625, 8.19091796875, 8.521484375, 8.85205078125, 9.1826171875, 9.51318359375, 9.84375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 6.0, 10.0, 9.0, 7.0, 17.0, 24.0, 26.0, 34.0, 38.0, 54.0, 57.0, 63.0, 76.0, 61.0, 67.0, 69.0, 65.0, 65.0, 46.0, 45.0, 29.0, 29.0, 20.0, 17.0, 20.0, 11.0, 4.0, 4.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.4603271484375, -8.076904296875, -7.6934814453125, -7.31005859375, -6.9266357421875, -6.543212890625, -6.1597900390625, -5.7763671875, -5.3929443359375, -5.009521484375, -4.6260986328125, -4.24267578125, -3.8592529296875, -3.475830078125, -3.0924072265625, -2.708984375, -2.3255615234375, -1.942138671875, -1.5587158203125, -1.17529296875, -0.7918701171875, -0.408447265625, -0.0250244140625, 0.3583984375, 0.7418212890625, 1.125244140625, 1.5086669921875, 1.89208984375, 2.2755126953125, 2.658935546875, 3.0423583984375, 3.42578125, 3.8092041015625, 4.192626953125, 4.5760498046875, 4.95947265625, 5.3428955078125, 5.726318359375, 6.1097412109375, 6.4931640625, 6.8765869140625, 7.260009765625, 7.6434326171875, 8.02685546875, 8.4102783203125, 8.793701171875, 9.1771240234375, 9.560546875, 9.9439697265625, 10.327392578125, 10.7108154296875, 11.09423828125, 11.4776611328125, 11.861083984375, 12.2445068359375, 12.6279296875, 13.0113525390625, 13.394775390625, 13.7781982421875, 14.16162109375, 14.5450439453125, 14.928466796875, 15.3118896484375, 15.6953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 10.0, 13.0, 17.0, 16.0, 22.0, 32.0, 33.0, 45.0, 67.0, 45.0, 61.0, 78.0, 97.0, 119.0, 158.0, 351.0, 1162.0, 7586.0, 160464.0, 838749.0, 34911.0, 2867.0, 653.0, 239.0, 130.0, 95.0, 77.0, 62.0, 56.0, 61.0, 49.0, 37.0, 28.0, 27.0, 27.0, 16.0, 12.0, 12.0, 13.0, 4.0, 6.0, 4.0, 8.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-12.2578125, -11.8895263671875, -11.521240234375, -11.1529541015625, -10.78466796875, -10.4163818359375, -10.048095703125, -9.6798095703125, -9.3115234375, -8.9432373046875, -8.574951171875, -8.2066650390625, -7.83837890625, -7.4700927734375, -7.101806640625, -6.7335205078125, -6.365234375, -5.9969482421875, -5.628662109375, -5.2603759765625, -4.89208984375, -4.5238037109375, -4.155517578125, -3.7872314453125, -3.4189453125, -3.0506591796875, -2.682373046875, -2.3140869140625, -1.94580078125, -1.5775146484375, -1.209228515625, -0.8409423828125, -0.47265625, -0.1043701171875, 0.263916015625, 0.6322021484375, 1.00048828125, 1.3687744140625, 1.737060546875, 2.1053466796875, 2.4736328125, 2.8419189453125, 3.210205078125, 3.5784912109375, 3.94677734375, 4.3150634765625, 4.683349609375, 5.0516357421875, 5.419921875, 5.7882080078125, 6.156494140625, 6.5247802734375, 6.89306640625, 7.2613525390625, 7.629638671875, 7.9979248046875, 8.3662109375, 8.7344970703125, 9.102783203125, 9.4710693359375, 9.83935546875, 10.2076416015625, 10.575927734375, 10.9442138671875, 11.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 2.0, 14.0, 6.0, 5.0, 12.0, 17.0, 12.0, 16.0, 23.0, 30.0, 23.0, 17.0, 23.0, 27.0, 24.0, 27.0, 31.0, 24.0, 34.0, 46.0, 41.0, 31.0, 40.0, 41.0, 41.0, 25.0, 29.0, 26.0, 25.0, 29.0, 34.0, 16.0, 22.0, 19.0, 21.0, 18.0, 16.0, 16.0, 17.0, 9.0, 7.0, 14.0, 8.0, 13.0, 8.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.55859375, -6.32904052734375, -6.0994873046875, -5.86993408203125, -5.640380859375, -5.41082763671875, -5.1812744140625, -4.95172119140625, -4.72216796875, -4.49261474609375, -4.2630615234375, -4.03350830078125, -3.803955078125, -3.57440185546875, -3.3448486328125, -3.11529541015625, -2.8857421875, -2.65618896484375, -2.4266357421875, -2.19708251953125, -1.967529296875, -1.73797607421875, -1.5084228515625, -1.27886962890625, -1.04931640625, -0.81976318359375, -0.5902099609375, -0.36065673828125, -0.131103515625, 0.09844970703125, 0.3280029296875, 0.55755615234375, 0.787109375, 1.01666259765625, 1.2462158203125, 1.47576904296875, 1.705322265625, 1.93487548828125, 2.1644287109375, 2.39398193359375, 2.62353515625, 2.85308837890625, 3.0826416015625, 3.31219482421875, 3.541748046875, 3.77130126953125, 4.0008544921875, 4.23040771484375, 4.4599609375, 4.68951416015625, 4.9190673828125, 5.14862060546875, 5.378173828125, 5.60772705078125, 5.8372802734375, 6.06683349609375, 6.29638671875, 6.52593994140625, 6.7554931640625, 6.98504638671875, 7.214599609375, 7.44415283203125, 7.6737060546875, 7.90325927734375, 8.1328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 5.0, 10.0, 14.0, 14.0, 33.0, 37.0, 41.0, 88.0, 132.0, 201.0, 366.0, 649.0, 1205.0, 2573.0, 6377.0, 18987.0, 76188.0, 464428.0, 385414.0, 64237.0, 16767.0, 5757.0, 2407.0, 1157.0, 628.0, 288.0, 209.0, 112.0, 68.0, 48.0, 41.0, 11.0, 17.0, 18.0, 5.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.3868255615234375, -1.342010498046875, -1.2971954345703125, -1.25238037109375, -1.2075653076171875, -1.162750244140625, -1.1179351806640625, -1.0731201171875, -1.0283050537109375, -0.983489990234375, -0.9386749267578125, -0.89385986328125, -0.8490447998046875, -0.804229736328125, -0.7594146728515625, -0.714599609375, -0.6697845458984375, -0.624969482421875, -0.5801544189453125, -0.53533935546875, -0.4905242919921875, -0.445709228515625, -0.4008941650390625, -0.3560791015625, -0.3112640380859375, -0.266448974609375, -0.2216339111328125, -0.17681884765625, -0.1320037841796875, -0.087188720703125, -0.0423736572265625, 0.00244140625, 0.0472564697265625, 0.092071533203125, 0.1368865966796875, 0.18170166015625, 0.2265167236328125, 0.271331787109375, 0.3161468505859375, 0.3609619140625, 0.4057769775390625, 0.450592041015625, 0.4954071044921875, 0.54022216796875, 0.5850372314453125, 0.629852294921875, 0.6746673583984375, 0.719482421875, 0.7642974853515625, 0.809112548828125, 0.8539276123046875, 0.89874267578125, 0.9435577392578125, 0.988372802734375, 1.0331878662109375, 1.0780029296875, 1.1228179931640625, 1.167633056640625, 1.2124481201171875, 1.25726318359375, 1.3020782470703125, 1.346893310546875, 1.3917083740234375, 1.4365234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 13.0, 13.0, 14.0, 21.0, 29.0, 34.0, 59.0, 68.0, 130.0, 149.0, 132.0, 99.0, 54.0, 45.0, 33.0, 27.0, 20.0, 14.0, 11.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00038170814514160156, -0.00037253648042678833, -0.0003633648157119751, -0.00035419315099716187, -0.00034502148628234863, -0.0003358498215675354, -0.00032667815685272217, -0.00031750649213790894, -0.0003083348274230957, -0.00029916316270828247, -0.00028999149799346924, -0.000280819833278656, -0.0002716481685638428, -0.00026247650384902954, -0.0002533048391342163, -0.00024413317441940308, -0.00023496150970458984, -0.0002257898449897766, -0.00021661818027496338, -0.00020744651556015015, -0.00019827485084533691, -0.00018910318613052368, -0.00017993152141571045, -0.00017075985670089722, -0.00016158819198608398, -0.00015241652727127075, -0.00014324486255645752, -0.0001340731978416443, -0.00012490153312683105, -0.00011572986841201782, -0.00010655820369720459, -9.738653898239136e-05, -8.821487426757812e-05, -7.904320955276489e-05, -6.987154483795166e-05, -6.069988012313843e-05, -5.1528215408325195e-05, -4.235655069351196e-05, -3.318488597869873e-05, -2.4013221263885498e-05, -1.4841556549072266e-05, -5.669891834259033e-06, 3.5017728805541992e-06, 1.2673437595367432e-05, 2.1845102310180664e-05, 3.1016767024993896e-05, 4.018843173980713e-05, 4.936009645462036e-05, 5.8531761169433594e-05, 6.770342588424683e-05, 7.687509059906006e-05, 8.604675531387329e-05, 9.521842002868652e-05, 0.00010439008474349976, 0.00011356174945831299, 0.00012273341417312622, 0.00013190507888793945, 0.00014107674360275269, 0.00015024840831756592, 0.00015942007303237915, 0.00016859173774719238, 0.00017776340246200562, 0.00018693506717681885, 0.00019610673189163208, 0.0002052783966064453]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 9.0, 1.0, 9.0, 13.0, 14.0, 24.0, 23.0, 38.0, 72.0, 112.0, 192.0, 299.0, 610.0, 1276.0, 2851.0, 7168.0, 21804.0, 81037.0, 463672.0, 372739.0, 66759.0, 18569.0, 6239.0, 2567.0, 1133.0, 544.0, 313.0, 167.0, 106.0, 62.0, 42.0, 34.0, 21.0, 13.0, 11.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12890625, -1.079681396484375, -1.03045654296875, -0.981231689453125, -0.9320068359375, -0.882781982421875, -0.83355712890625, -0.784332275390625, -0.735107421875, -0.685882568359375, -0.63665771484375, -0.587432861328125, -0.5382080078125, -0.488983154296875, -0.43975830078125, -0.390533447265625, -0.34130859375, -0.292083740234375, -0.24285888671875, -0.193634033203125, -0.1444091796875, -0.095184326171875, -0.04595947265625, 0.003265380859375, 0.052490234375, 0.101715087890625, 0.15093994140625, 0.200164794921875, 0.2493896484375, 0.298614501953125, 0.34783935546875, 0.397064208984375, 0.4462890625, 0.495513916015625, 0.54473876953125, 0.593963623046875, 0.6431884765625, 0.692413330078125, 0.74163818359375, 0.790863037109375, 0.840087890625, 0.889312744140625, 0.93853759765625, 0.987762451171875, 1.0369873046875, 1.086212158203125, 1.13543701171875, 1.184661865234375, 1.23388671875, 1.283111572265625, 1.33233642578125, 1.381561279296875, 1.4307861328125, 1.480010986328125, 1.52923583984375, 1.578460693359375, 1.627685546875, 1.676910400390625, 1.72613525390625, 1.775360107421875, 1.8245849609375, 1.873809814453125, 1.92303466796875, 1.972259521484375, 2.021484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 15.0, 17.0, 20.0, 29.0, 25.0, 43.0, 52.0, 64.0, 91.0, 106.0, 113.0, 89.0, 64.0, 61.0, 50.0, 21.0, 21.0, 17.0, 20.0, 10.0, 12.0, 9.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.931640625, -0.9070281982421875, -0.882415771484375, -0.8578033447265625, -0.83319091796875, -0.8085784912109375, -0.783966064453125, -0.7593536376953125, -0.7347412109375, -0.7101287841796875, -0.685516357421875, -0.6609039306640625, -0.63629150390625, -0.6116790771484375, -0.587066650390625, -0.5624542236328125, -0.537841796875, -0.5132293701171875, -0.488616943359375, -0.4640045166015625, -0.43939208984375, -0.4147796630859375, -0.390167236328125, -0.3655548095703125, -0.3409423828125, -0.3163299560546875, -0.291717529296875, -0.2671051025390625, -0.24249267578125, -0.2178802490234375, -0.193267822265625, -0.1686553955078125, -0.14404296875, -0.1194305419921875, -0.094818115234375, -0.0702056884765625, -0.04559326171875, -0.0209808349609375, 0.003631591796875, 0.0282440185546875, 0.0528564453125, 0.0774688720703125, 0.102081298828125, 0.1266937255859375, 0.15130615234375, 0.1759185791015625, 0.200531005859375, 0.2251434326171875, 0.249755859375, 0.2743682861328125, 0.298980712890625, 0.3235931396484375, 0.34820556640625, 0.3728179931640625, 0.397430419921875, 0.4220428466796875, 0.4466552734375, 0.4712677001953125, 0.495880126953125, 0.5204925537109375, 0.54510498046875, 0.5697174072265625, 0.594329833984375, 0.6189422607421875, 0.6435546875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 15.0, 40.0, 68.0, 103.0, 180.0, 191.0, 187.0, 91.0, 58.0, 26.0, 17.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.85233497619629, -24.03775405883789, -23.22317123413086, -22.40859031677246, -21.59400749206543, -20.77942657470703, -19.96484375, -19.1502628326416, -18.33568000793457, -17.521099090576172, -16.70651626586914, -15.891934394836426, -15.077352523803711, -14.262771606445312, -13.448188781738281, -12.633607864379883, -11.819025993347168, -11.004444122314453, -10.189862251281738, -9.375280380249023, -8.560698509216309, -7.746117115020752, -6.931535243988037, -6.116953372955322, -5.302371501922607, -4.487789630889893, -3.6732077598571777, -2.858626127243042, -2.044044256210327, -1.2294626235961914, -0.41488075256347656, 0.3997011184692383, 1.2142829895019531, 2.028864860534668, 2.843446731567383, 3.6580283641815186, 4.4726104736328125, 5.287191867828369, 6.101773738861084, 6.916355609893799, 7.730937480926514, 8.54551887512207, 9.360100746154785, 10.1746826171875, 10.989264488220215, 11.80384635925293, 12.618428230285645, 13.43301010131836, 14.247591972351074, 15.062173843383789, 15.876755714416504, 16.69133758544922, 17.505918502807617, 18.32050132751465, 19.135082244873047, 19.949665069580078, 20.764245986938477, 21.578826904296875, 22.393409729003906, 23.207990646362305, 24.022573471069336, 24.837154388427734, 25.651737213134766, 26.466318130493164, 27.280900955200195]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 1.0, 7.0, 15.0, 20.0, 24.0, 24.0, 24.0, 18.0, 19.0, 25.0, 29.0, 38.0, 31.0, 52.0, 50.0, 35.0, 49.0, 43.0, 41.0, 41.0, 37.0, 44.0, 27.0, 35.0, 29.0, 33.0, 33.0, 27.0, 20.0, 19.0, 16.0, 17.0, 10.0, 12.0, 13.0, 9.0, 8.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.63160228729248, -12.160292625427246, -11.688982963562012, -11.217673301696777, -10.746363639831543, -10.275053977966309, -9.803743362426758, -9.332433700561523, -8.861124038696289, -8.389814376831055, -7.91850471496582, -7.447195053100586, -6.975885391235352, -6.504575729370117, -6.033265590667725, -5.56195592880249, -5.090646743774414, -4.61933708190918, -4.148027420043945, -3.676717519760132, -3.2054078578948975, -2.734098196029663, -2.2627882957458496, -1.7914786338806152, -1.3201689720153809, -0.8488592505455017, -0.37754952907562256, 0.09376025199890137, 0.5650699138641357, 1.0363795757293701, 1.5076894760131836, 1.978999137878418, 2.4503097534179688, 2.921619415283203, 3.3929290771484375, 3.864238977432251, 4.335548400878906, 4.806858062744141, 5.278168201446533, 5.749477863311768, 6.220787525177002, 6.692097187042236, 7.163406848907471, 7.634716987609863, 8.106026649475098, 8.577336311340332, 9.048645973205566, 9.5199556350708, 9.991265296936035, 10.46257495880127, 10.933884620666504, 11.405194282531738, 11.876503944396973, 12.347813606262207, 12.819124221801758, 13.290433883666992, 13.761743545532227, 14.233053207397461, 14.704362869262695, 15.17567253112793, 15.646982192993164, 16.1182918548584, 16.589601516723633, 17.060911178588867, 17.5322208404541]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 10.0, 7.0, 9.0, 10.0, 11.0, 18.0, 30.0, 36.0, 38.0, 44.0, 71.0, 112.0, 169.0, 278.0, 443.0, 852.0, 1880.0, 4561.0, 12651.0, 56587.0, 545609.0, 3040500.0, 464109.0, 47053.0, 11418.0, 3945.0, 1734.0, 820.0, 464.0, 258.0, 163.0, 108.0, 79.0, 47.0, 43.0, 22.0, 17.0, 16.0, 9.0, 12.0, 12.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.510498046875, -8.20068359375, -7.890869140625, -7.5810546875, -7.271240234375, -6.96142578125, -6.651611328125, -6.341796875, -6.031982421875, -5.72216796875, -5.412353515625, -5.1025390625, -4.792724609375, -4.48291015625, -4.173095703125, -3.86328125, -3.553466796875, -3.24365234375, -2.933837890625, -2.6240234375, -2.314208984375, -2.00439453125, -1.694580078125, -1.384765625, -1.074951171875, -0.76513671875, -0.455322265625, -0.1455078125, 0.164306640625, 0.47412109375, 0.783935546875, 1.09375, 1.403564453125, 1.71337890625, 2.023193359375, 2.3330078125, 2.642822265625, 2.95263671875, 3.262451171875, 3.572265625, 3.882080078125, 4.19189453125, 4.501708984375, 4.8115234375, 5.121337890625, 5.43115234375, 5.740966796875, 6.05078125, 6.360595703125, 6.67041015625, 6.980224609375, 7.2900390625, 7.599853515625, 7.90966796875, 8.219482421875, 8.529296875, 8.839111328125, 9.14892578125, 9.458740234375, 9.7685546875, 10.078369140625, 10.38818359375, 10.697998046875, 11.0078125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 13.0, 14.0, 28.0, 38.0, 28.0, 38.0, 39.0, 65.0, 74.0, 69.0, 63.0, 76.0, 81.0, 63.0, 56.0, 38.0, 43.0, 40.0, 22.0, 22.0, 20.0, 18.0, 13.0, 5.0, 10.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2109375, -6.96533203125, -6.7197265625, -6.47412109375, -6.228515625, -5.98291015625, -5.7373046875, -5.49169921875, -5.24609375, -5.00048828125, -4.7548828125, -4.50927734375, -4.263671875, -4.01806640625, -3.7724609375, -3.52685546875, -3.28125, -3.03564453125, -2.7900390625, -2.54443359375, -2.298828125, -2.05322265625, -1.8076171875, -1.56201171875, -1.31640625, -1.07080078125, -0.8251953125, -0.57958984375, -0.333984375, -0.08837890625, 0.1572265625, 0.40283203125, 0.6484375, 0.89404296875, 1.1396484375, 1.38525390625, 1.630859375, 1.87646484375, 2.1220703125, 2.36767578125, 2.61328125, 2.85888671875, 3.1044921875, 3.35009765625, 3.595703125, 3.84130859375, 4.0869140625, 4.33251953125, 4.578125, 4.82373046875, 5.0693359375, 5.31494140625, 5.560546875, 5.80615234375, 6.0517578125, 6.29736328125, 6.54296875, 6.78857421875, 7.0341796875, 7.27978515625, 7.525390625, 7.77099609375, 8.0166015625, 8.26220703125, 8.5078125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 8.0, 4.0, 11.0, 31.0, 60.0, 105.0, 252.0, 853.0, 10362.0, 3910388.0, 268017.0, 3212.0, 576.0, 190.0, 88.0, 53.0, 19.0, 14.0, 10.0, 9.0, 10.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-43.28125, -42.3154296875, -41.349609375, -40.3837890625, -39.41796875, -38.4521484375, -37.486328125, -36.5205078125, -35.5546875, -34.5888671875, -33.623046875, -32.6572265625, -31.69140625, -30.7255859375, -29.759765625, -28.7939453125, -27.828125, -26.8623046875, -25.896484375, -24.9306640625, -23.96484375, -22.9990234375, -22.033203125, -21.0673828125, -20.1015625, -19.1357421875, -18.169921875, -17.2041015625, -16.23828125, -15.2724609375, -14.306640625, -13.3408203125, -12.375, -11.4091796875, -10.443359375, -9.4775390625, -8.51171875, -7.5458984375, -6.580078125, -5.6142578125, -4.6484375, -3.6826171875, -2.716796875, -1.7509765625, -0.78515625, 0.1806640625, 1.146484375, 2.1123046875, 3.078125, 4.0439453125, 5.009765625, 5.9755859375, 6.94140625, 7.9072265625, 8.873046875, 9.8388671875, 10.8046875, 11.7705078125, 12.736328125, 13.7021484375, 14.66796875, 15.6337890625, 16.599609375, 17.5654296875, 18.53125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 2.0, 3.0, 7.0, 11.0, 8.0, 6.0, 23.0, 23.0, 28.0, 41.0, 53.0, 72.0, 103.0, 146.0, 235.0, 415.0, 621.0, 669.0, 553.0, 366.0, 226.0, 117.0, 96.0, 73.0, 46.0, 30.0, 28.0, 19.0, 15.0, 10.0, 7.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.439453125, -2.36407470703125, -2.2886962890625, -2.21331787109375, -2.137939453125, -2.06256103515625, -1.9871826171875, -1.91180419921875, -1.83642578125, -1.76104736328125, -1.6856689453125, -1.61029052734375, -1.534912109375, -1.45953369140625, -1.3841552734375, -1.30877685546875, -1.2333984375, -1.15802001953125, -1.0826416015625, -1.00726318359375, -0.931884765625, -0.85650634765625, -0.7811279296875, -0.70574951171875, -0.63037109375, -0.55499267578125, -0.4796142578125, -0.40423583984375, -0.328857421875, -0.25347900390625, -0.1781005859375, -0.10272216796875, -0.02734375, 0.04803466796875, 0.1234130859375, 0.19879150390625, 0.274169921875, 0.34954833984375, 0.4249267578125, 0.50030517578125, 0.57568359375, 0.65106201171875, 0.7264404296875, 0.80181884765625, 0.877197265625, 0.95257568359375, 1.0279541015625, 1.10333251953125, 1.1787109375, 1.25408935546875, 1.3294677734375, 1.40484619140625, 1.480224609375, 1.55560302734375, 1.6309814453125, 1.70635986328125, 1.78173828125, 1.85711669921875, 1.9324951171875, 2.00787353515625, 2.083251953125, 2.15863037109375, 2.2340087890625, 2.30938720703125, 2.384765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 7.0, 7.0, 13.0, 26.0, 40.0, 74.0, 87.0, 141.0, 171.0, 153.0, 118.0, 69.0, 48.0, 19.0, 17.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.299962043762207, -6.768779277801514, -6.23759651184082, -5.706414222717285, -5.175231456756592, -4.644048690795898, -4.112866401672363, -3.58168363571167, -3.0505008697509766, -2.519318103790283, -1.988135576248169, -1.4569529294967651, -0.9257702827453613, -0.39458751678466797, 0.1365950107574463, 0.6677775382995605, 1.198960304260254, 1.7301429510116577, 2.2613255977630615, 2.792508125305176, 3.323690891265869, 3.8548736572265625, 4.386055946350098, 4.917238712310791, 5.448421478271484, 5.979604244232178, 6.510787010192871, 7.041969299316406, 7.5731520652771, 8.104334831237793, 8.635517120361328, 9.16670036315918, 9.697881698608398, 10.229063987731934, 10.760247230529785, 11.29142951965332, 11.822612762451172, 12.353795051574707, 12.884977340698242, 13.416160583496094, 13.947342872619629, 14.478525161743164, 15.009708404541016, 15.54089069366455, 16.072072982788086, 16.603256225585938, 17.13443946838379, 17.665620803833008, 18.19680404663086, 18.72798728942871, 19.25916862487793, 19.79035186767578, 20.321535110473633, 20.852718353271484, 21.383899688720703, 21.915082931518555, 22.446266174316406, 22.977449417114258, 23.508630752563477, 24.039813995361328, 24.57099723815918, 25.10218048095703, 25.63336181640625, 26.1645450592041, 26.69572639465332]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 13.0, 14.0, 22.0, 25.0, 32.0, 32.0, 44.0, 61.0, 70.0, 62.0, 54.0, 60.0, 67.0, 60.0, 63.0, 56.0, 48.0, 45.0, 31.0, 38.0, 26.0, 16.0, 13.0, 14.0, 8.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.333297729492188, -8.063886642456055, -7.7944746017456055, -7.5250630378723145, -7.255651473999023, -6.986239910125732, -6.716828346252441, -6.44741678237915, -6.178005218505859, -5.908593654632568, -5.639182090759277, -5.369770526885986, -5.100358963012695, -4.830947399139404, -4.561535835266113, -4.292124271392822, -4.022712707519531, -3.7533011436462402, -3.483889579772949, -3.214478015899658, -2.945066452026367, -2.675654888153076, -2.406243324279785, -2.136831760406494, -1.8674201965332031, -1.598008632659912, -1.328597068786621, -1.05918550491333, -0.7897739410400391, -0.520362377166748, -0.25095081329345703, 0.018460750579833984, 0.2878713607788086, 0.5572829246520996, 0.8266944885253906, 1.0961060523986816, 1.3655176162719727, 1.6349291801452637, 1.9043407440185547, 2.1737523078918457, 2.4431638717651367, 2.7125754356384277, 2.9819869995117188, 3.2513985633850098, 3.520810127258301, 3.790221691131592, 4.059633255004883, 4.329044818878174, 4.598456382751465, 4.867867946624756, 5.137279510498047, 5.406691074371338, 5.676102638244629, 5.94551420211792, 6.214925765991211, 6.484337329864502, 6.753748893737793, 7.023160457611084, 7.292572021484375, 7.561983585357666, 7.831395149230957, 8.100807189941406, 8.370218276977539, 8.639629364013672, 8.909041404724121]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 12.0, 9.0, 31.0, 42.0, 116.0, 188.0, 365.0, 749.0, 1710.0, 3889.0, 9678.0, 27898.0, 121484.0, 602505.0, 217107.0, 40629.0, 12915.0, 5126.0, 2111.0, 1024.0, 458.0, 235.0, 121.0, 62.0, 35.0, 16.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7578125, -2.680450439453125, -2.60308837890625, -2.525726318359375, -2.4483642578125, -2.371002197265625, -2.29364013671875, -2.216278076171875, -2.138916015625, -2.061553955078125, -1.98419189453125, -1.906829833984375, -1.8294677734375, -1.752105712890625, -1.67474365234375, -1.597381591796875, -1.52001953125, -1.442657470703125, -1.36529541015625, -1.287933349609375, -1.2105712890625, -1.133209228515625, -1.05584716796875, -0.978485107421875, -0.901123046875, -0.823760986328125, -0.74639892578125, -0.669036865234375, -0.5916748046875, -0.514312744140625, -0.43695068359375, -0.359588623046875, -0.2822265625, -0.204864501953125, -0.12750244140625, -0.050140380859375, 0.0272216796875, 0.104583740234375, 0.18194580078125, 0.259307861328125, 0.336669921875, 0.414031982421875, 0.49139404296875, 0.568756103515625, 0.6461181640625, 0.723480224609375, 0.80084228515625, 0.878204345703125, 0.95556640625, 1.032928466796875, 1.11029052734375, 1.187652587890625, 1.2650146484375, 1.342376708984375, 1.41973876953125, 1.497100830078125, 1.574462890625, 1.651824951171875, 1.72918701171875, 1.806549072265625, 1.8839111328125, 1.961273193359375, 2.03863525390625, 2.115997314453125, 2.193359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 5.0, 6.0, 19.0, 18.0, 34.0, 32.0, 36.0, 57.0, 49.0, 90.0, 76.0, 73.0, 62.0, 64.0, 68.0, 66.0, 62.0, 40.0, 29.0, 37.0, 27.0, 17.0, 8.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.203125, -5.004638671875, -4.80615234375, -4.607666015625, -4.4091796875, -4.210693359375, -4.01220703125, -3.813720703125, -3.615234375, -3.416748046875, -3.21826171875, -3.019775390625, -2.8212890625, -2.622802734375, -2.42431640625, -2.225830078125, -2.02734375, -1.828857421875, -1.63037109375, -1.431884765625, -1.2333984375, -1.034912109375, -0.83642578125, -0.637939453125, -0.439453125, -0.240966796875, -0.04248046875, 0.156005859375, 0.3544921875, 0.552978515625, 0.75146484375, 0.949951171875, 1.1484375, 1.346923828125, 1.54541015625, 1.743896484375, 1.9423828125, 2.140869140625, 2.33935546875, 2.537841796875, 2.736328125, 2.934814453125, 3.13330078125, 3.331787109375, 3.5302734375, 3.728759765625, 3.92724609375, 4.125732421875, 4.32421875, 4.522705078125, 4.72119140625, 4.919677734375, 5.1181640625, 5.316650390625, 5.51513671875, 5.713623046875, 5.912109375, 6.110595703125, 6.30908203125, 6.507568359375, 6.7060546875, 6.904541015625, 7.10302734375, 7.301513671875, 7.5]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 8.0, 3.0, 9.0, 10.0, 15.0, 30.0, 38.0, 77.0, 124.0, 283.0, 550.0, 1324.0, 3802.0, 11766.0, 52987.0, 525195.0, 396463.0, 40535.0, 9761.0, 3230.0, 1254.0, 528.0, 224.0, 126.0, 66.0, 38.0, 22.0, 10.0, 18.0, 13.0, 7.0, 5.0, 5.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.25, -3.156951904296875, -3.06390380859375, -2.970855712890625, -2.8778076171875, -2.784759521484375, -2.69171142578125, -2.598663330078125, -2.505615234375, -2.412567138671875, -2.31951904296875, -2.226470947265625, -2.1334228515625, -2.040374755859375, -1.94732666015625, -1.854278564453125, -1.76123046875, -1.668182373046875, -1.57513427734375, -1.482086181640625, -1.3890380859375, -1.295989990234375, -1.20294189453125, -1.109893798828125, -1.016845703125, -0.923797607421875, -0.83074951171875, -0.737701416015625, -0.6446533203125, -0.551605224609375, -0.45855712890625, -0.365509033203125, -0.2724609375, -0.179412841796875, -0.08636474609375, 0.006683349609375, 0.0997314453125, 0.192779541015625, 0.28582763671875, 0.378875732421875, 0.471923828125, 0.564971923828125, 0.65802001953125, 0.751068115234375, 0.8441162109375, 0.937164306640625, 1.03021240234375, 1.123260498046875, 1.21630859375, 1.309356689453125, 1.40240478515625, 1.495452880859375, 1.5885009765625, 1.681549072265625, 1.77459716796875, 1.867645263671875, 1.960693359375, 2.053741455078125, 2.14678955078125, 2.239837646484375, 2.3328857421875, 2.425933837890625, 2.51898193359375, 2.612030029296875, 2.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 15.0, 7.0, 11.0, 18.0, 18.0, 16.0, 15.0, 27.0, 30.0, 40.0, 33.0, 30.0, 33.0, 36.0, 52.0, 47.0, 37.0, 56.0, 43.0, 43.0, 47.0, 49.0, 40.0, 44.0, 35.0, 27.0, 27.0, 16.0, 20.0, 16.0, 11.0, 16.0, 14.0, 10.0, 6.0, 0.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3125, -8.0380859375, -7.763671875, -7.4892578125, -7.21484375, -6.9404296875, -6.666015625, -6.3916015625, -6.1171875, -5.8427734375, -5.568359375, -5.2939453125, -5.01953125, -4.7451171875, -4.470703125, -4.1962890625, -3.921875, -3.6474609375, -3.373046875, -3.0986328125, -2.82421875, -2.5498046875, -2.275390625, -2.0009765625, -1.7265625, -1.4521484375, -1.177734375, -0.9033203125, -0.62890625, -0.3544921875, -0.080078125, 0.1943359375, 0.46875, 0.7431640625, 1.017578125, 1.2919921875, 1.56640625, 1.8408203125, 2.115234375, 2.3896484375, 2.6640625, 2.9384765625, 3.212890625, 3.4873046875, 3.76171875, 4.0361328125, 4.310546875, 4.5849609375, 4.859375, 5.1337890625, 5.408203125, 5.6826171875, 5.95703125, 6.2314453125, 6.505859375, 6.7802734375, 7.0546875, 7.3291015625, 7.603515625, 7.8779296875, 8.15234375, 8.4267578125, 8.701171875, 8.9755859375, 9.25]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 11.0, 20.0, 22.0, 21.0, 38.0, 42.0, 69.0, 102.0, 162.0, 263.0, 473.0, 863.0, 1851.0, 4242.0, 12673.0, 54448.0, 416927.0, 472910.0, 60767.0, 13839.0, 4605.0, 1937.0, 952.0, 518.0, 294.0, 137.0, 118.0, 70.0, 42.0, 41.0, 23.0, 14.0, 9.0, 5.0, 2.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.177734375, -1.145050048828125, -1.11236572265625, -1.079681396484375, -1.0469970703125, -1.014312744140625, -0.98162841796875, -0.948944091796875, -0.916259765625, -0.883575439453125, -0.85089111328125, -0.818206787109375, -0.7855224609375, -0.752838134765625, -0.72015380859375, -0.687469482421875, -0.65478515625, -0.622100830078125, -0.58941650390625, -0.556732177734375, -0.5240478515625, -0.491363525390625, -0.45867919921875, -0.425994873046875, -0.393310546875, -0.360626220703125, -0.32794189453125, -0.295257568359375, -0.2625732421875, -0.229888916015625, -0.19720458984375, -0.164520263671875, -0.1318359375, -0.099151611328125, -0.06646728515625, -0.033782958984375, -0.0010986328125, 0.031585693359375, 0.06427001953125, 0.096954345703125, 0.129638671875, 0.162322998046875, 0.19500732421875, 0.227691650390625, 0.2603759765625, 0.293060302734375, 0.32574462890625, 0.358428955078125, 0.39111328125, 0.423797607421875, 0.45648193359375, 0.489166259765625, 0.5218505859375, 0.554534912109375, 0.58721923828125, 0.619903564453125, 0.652587890625, 0.685272216796875, 0.71795654296875, 0.750640869140625, 0.7833251953125, 0.816009521484375, 0.84869384765625, 0.881378173828125, 0.9140625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 4.0, 9.0, 12.0, 7.0, 16.0, 54.0, 68.0, 97.0, 135.0, 180.0, 157.0, 96.0, 72.0, 40.0, 18.0, 14.0, 9.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005178451538085938, -0.0004976168274879456, -0.00047738850116729736, -0.00045716017484664917, -0.000436931848526001, -0.0004167035222053528, -0.0003964751958847046, -0.0003762468695640564, -0.0003560185432434082, -0.00033579021692276, -0.0003155618906021118, -0.0002953335642814636, -0.00027510523796081543, -0.00025487691164016724, -0.00023464858531951904, -0.00021442025899887085, -0.00019419193267822266, -0.00017396360635757446, -0.00015373528003692627, -0.00013350695371627808, -0.00011327862739562988, -9.305030107498169e-05, -7.28219747543335e-05, -5.25936484336853e-05, -3.236532211303711e-05, -1.2136995792388916e-05, 8.091330528259277e-06, 2.831965684890747e-05, 4.8547983169555664e-05, 6.877630949020386e-05, 8.900463581085205e-05, 0.00010923296213150024, 0.00012946128845214844, 0.00014968961477279663, 0.00016991794109344482, 0.00019014626741409302, 0.0002103745937347412, 0.0002306029200553894, 0.0002508312463760376, 0.0002710595726966858, 0.000291287899017334, 0.0003115162253379822, 0.00033174455165863037, 0.00035197287797927856, 0.00037220120429992676, 0.00039242953062057495, 0.00041265785694122314, 0.00043288618326187134, 0.00045311450958251953, 0.0004733428359031677, 0.0004935711622238159, 0.0005137994885444641, 0.0005340278148651123, 0.0005542561411857605, 0.0005744844675064087, 0.0005947127938270569, 0.0006149411201477051, 0.0006351694464683533, 0.0006553977727890015, 0.0006756260991096497, 0.0006958544254302979, 0.000716082751750946, 0.0007363110780715942, 0.0007565394043922424, 0.0007767677307128906]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 7.0, 4.0, 3.0, 9.0, 14.0, 18.0, 27.0, 33.0, 65.0, 105.0, 146.0, 273.0, 493.0, 917.0, 1841.0, 3853.0, 10534.0, 46450.0, 367521.0, 527414.0, 66233.0, 13584.0, 4587.0, 2067.0, 1019.0, 578.0, 307.0, 169.0, 86.0, 73.0, 45.0, 25.0, 16.0, 15.0, 11.0, 11.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.205078125, -1.17169189453125, -1.1383056640625, -1.10491943359375, -1.071533203125, -1.03814697265625, -1.0047607421875, -0.97137451171875, -0.93798828125, -0.90460205078125, -0.8712158203125, -0.83782958984375, -0.804443359375, -0.77105712890625, -0.7376708984375, -0.70428466796875, -0.6708984375, -0.63751220703125, -0.6041259765625, -0.57073974609375, -0.537353515625, -0.50396728515625, -0.4705810546875, -0.43719482421875, -0.40380859375, -0.37042236328125, -0.3370361328125, -0.30364990234375, -0.270263671875, -0.23687744140625, -0.2034912109375, -0.17010498046875, -0.13671875, -0.10333251953125, -0.0699462890625, -0.03656005859375, -0.003173828125, 0.03021240234375, 0.0635986328125, 0.09698486328125, 0.13037109375, 0.16375732421875, 0.1971435546875, 0.23052978515625, 0.263916015625, 0.29730224609375, 0.3306884765625, 0.36407470703125, 0.3974609375, 0.43084716796875, 0.4642333984375, 0.49761962890625, 0.531005859375, 0.56439208984375, 0.5977783203125, 0.63116455078125, 0.66455078125, 0.69793701171875, 0.7313232421875, 0.76470947265625, 0.798095703125, 0.83148193359375, 0.8648681640625, 0.89825439453125, 0.931640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 5.0, 13.0, 20.0, 25.0, 41.0, 56.0, 91.0, 112.0, 150.0, 135.0, 112.0, 75.0, 49.0, 40.0, 25.0, 14.0, 7.0, 10.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30712890625, -0.2980155944824219, -0.28890228271484375, -0.2797889709472656, -0.2706756591796875, -0.2615623474121094, -0.25244903564453125, -0.24333572387695312, -0.234222412109375, -0.22510910034179688, -0.21599578857421875, -0.20688247680664062, -0.1977691650390625, -0.18865585327148438, -0.17954254150390625, -0.17042922973632812, -0.16131591796875, -0.15220260620117188, -0.14308929443359375, -0.13397598266601562, -0.1248626708984375, -0.11574935913085938, -0.10663604736328125, -0.09752273559570312, -0.088409423828125, -0.07929611206054688, -0.07018280029296875, -0.061069488525390625, -0.0519561767578125, -0.042842864990234375, -0.03372955322265625, -0.024616241455078125, -0.0155029296875, -0.006389617919921875, 0.00272369384765625, 0.011837005615234375, 0.0209503173828125, 0.030063629150390625, 0.03917694091796875, 0.048290252685546875, 0.057403564453125, 0.06651687622070312, 0.07563018798828125, 0.08474349975585938, 0.0938568115234375, 0.10297012329101562, 0.11208343505859375, 0.12119674682617188, 0.13031005859375, 0.13942337036132812, 0.14853668212890625, 0.15764999389648438, 0.1667633056640625, 0.17587661743164062, 0.18498992919921875, 0.19410324096679688, 0.203216552734375, 0.21232986450195312, 0.22144317626953125, 0.23055648803710938, 0.2396697998046875, 0.24878311157226562, 0.25789642333984375, 0.2670097351074219, 0.276123046875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 10.0, 21.0, 39.0, 55.0, 115.0, 157.0, 224.0, 175.0, 94.0, 55.0, 29.0, 11.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.488933086395264, -5.083921909332275, -4.678911209106445, -4.273900032043457, -3.868889331817627, -3.4638781547546387, -3.0588672161102295, -2.6538562774658203, -2.248845338821411, -1.843834400177002, -1.4388234615325928, -1.033812403678894, -0.6288014650344849, -0.22379040718078613, 0.18122053146362305, 0.5862314701080322, 0.9912424087524414, 1.3962533473968506, 1.8012642860412598, 2.206275463104248, 2.611286163330078, 3.0162973403930664, 3.4213082790374756, 3.8263192176818848, 4.231329917907715, 4.636341094970703, 5.041351795196533, 5.4463629722595215, 5.851373672485352, 6.25638484954834, 6.661396026611328, 7.066406726837158, 7.471417427062988, 7.876428604125977, 8.281439781188965, 8.686450004577637, 9.091461181640625, 9.496472358703613, 9.901483535766602, 10.306493759155273, 10.711504936218262, 11.11651611328125, 11.521527290344238, 11.92653751373291, 12.331548690795898, 12.736559867858887, 13.141571044921875, 13.546581268310547, 13.951593399047852, 14.35660457611084, 14.761615753173828, 15.1666259765625, 15.571637153625488, 15.976648330688477, 16.38165855407715, 16.786670684814453, 17.191680908203125, 17.596691131591797, 18.0017032623291, 18.406713485717773, 18.811725616455078, 19.21673583984375, 19.621746063232422, 20.026758193969727, 20.4317684173584]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 5.0, 11.0, 7.0, 9.0, 26.0, 34.0, 37.0, 35.0, 51.0, 63.0, 71.0, 73.0, 64.0, 60.0, 68.0, 67.0, 63.0, 51.0, 46.0, 43.0, 27.0, 34.0, 9.0, 16.0, 12.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3008198738098145, -5.121241569519043, -4.9416632652282715, -4.7620849609375, -4.58250617980957, -4.402927875518799, -4.223349571228027, -4.043771266937256, -3.8641929626464844, -3.684614658355713, -3.5050363540649414, -3.325457811355591, -3.1458795070648193, -2.966301202774048, -2.7867226600646973, -2.607144355773926, -2.4275660514831543, -2.247987747192383, -2.0684094429016113, -1.8888309001922607, -1.7092525959014893, -1.5296742916107178, -1.3500958681106567, -1.1705174446105957, -0.9909391403198242, -0.811360776424408, -0.6317824125289917, -0.45220404863357544, -0.2726256847381592, -0.09304732084274292, 0.08653104305267334, 0.2661094665527344, 0.44568729400634766, 0.6252656579017639, 0.8048440217971802, 0.9844223856925964, 1.1640007495880127, 1.3435790538787842, 1.5231574773788452, 1.7027359008789062, 1.8823142051696777, 2.061892509460449, 2.2414708137512207, 2.4210493564605713, 2.6006276607513428, 2.7802059650421143, 2.959784507751465, 3.1393628120422363, 3.318941116333008, 3.4985194206237793, 3.678097724914551, 3.8576762676239014, 4.037254333496094, 4.216833114624023, 4.396411418914795, 4.575989723205566, 4.755568027496338, 4.935146331787109, 5.114724636077881, 5.294302940368652, 5.473881721496582, 5.6534600257873535, 5.833038330078125, 6.0126166343688965, 6.192194938659668]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 1.0, 8.0, 6.0, 16.0, 12.0, 39.0, 73.0, 189.0, 676.0, 3007.0, 25392.0, 908994.0, 101551.0, 6866.0, 1224.0, 290.0, 99.0, 37.0, 19.0, 14.0, 11.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.875, -14.390625, -13.90625, -13.421875, -12.9375, -12.453125, -11.96875, -11.484375, -11.0, -10.515625, -10.03125, -9.546875, -9.0625, -8.578125, -8.09375, -7.609375, -7.125, -6.640625, -6.15625, -5.671875, -5.1875, -4.703125, -4.21875, -3.734375, -3.25, -2.765625, -2.28125, -1.796875, -1.3125, -0.828125, -0.34375, 0.140625, 0.625, 1.109375, 1.59375, 2.078125, 2.5625, 3.046875, 3.53125, 4.015625, 4.5, 4.984375, 5.46875, 5.953125, 6.4375, 6.921875, 7.40625, 7.890625, 8.375, 8.859375, 9.34375, 9.828125, 10.3125, 10.796875, 11.28125, 11.765625, 12.25, 12.734375, 13.21875, 13.703125, 14.1875, 14.671875, 15.15625, 15.640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 5.0, 5.0, 4.0, 14.0, 20.0, 19.0, 20.0, 31.0, 32.0, 43.0, 37.0, 38.0, 44.0, 55.0, 60.0, 59.0, 57.0, 48.0, 62.0, 46.0, 49.0, 35.0, 31.0, 28.0, 34.0, 20.0, 21.0, 18.0, 10.0, 13.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.260498046875, -7.94287109375, -7.625244140625, -7.3076171875, -6.989990234375, -6.67236328125, -6.354736328125, -6.037109375, -5.719482421875, -5.40185546875, -5.084228515625, -4.7666015625, -4.448974609375, -4.13134765625, -3.813720703125, -3.49609375, -3.178466796875, -2.86083984375, -2.543212890625, -2.2255859375, -1.907958984375, -1.59033203125, -1.272705078125, -0.955078125, -0.637451171875, -0.31982421875, -0.002197265625, 0.3154296875, 0.633056640625, 0.95068359375, 1.268310546875, 1.5859375, 1.903564453125, 2.22119140625, 2.538818359375, 2.8564453125, 3.174072265625, 3.49169921875, 3.809326171875, 4.126953125, 4.444580078125, 4.76220703125, 5.079833984375, 5.3974609375, 5.715087890625, 6.03271484375, 6.350341796875, 6.66796875, 6.985595703125, 7.30322265625, 7.620849609375, 7.9384765625, 8.256103515625, 8.57373046875, 8.891357421875, 9.208984375, 9.526611328125, 9.84423828125, 10.161865234375, 10.4794921875, 10.797119140625, 11.11474609375, 11.432373046875, 11.75]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 10.0, 10.0, 20.0, 15.0, 33.0, 43.0, 43.0, 44.0, 86.0, 115.0, 205.0, 339.0, 552.0, 964.0, 1761.0, 3723.0, 8752.0, 25747.0, 140137.0, 696985.0, 128013.0, 24828.0, 8420.0, 3607.0, 1766.0, 887.0, 506.0, 281.0, 211.0, 131.0, 82.0, 56.0, 29.0, 26.0, 23.0, 24.0, 18.0, 12.0, 9.0, 4.0, 4.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.609375, -4.4581298828125, -4.306884765625, -4.1556396484375, -4.00439453125, -3.8531494140625, -3.701904296875, -3.5506591796875, -3.3994140625, -3.2481689453125, -3.096923828125, -2.9456787109375, -2.79443359375, -2.6431884765625, -2.491943359375, -2.3406982421875, -2.189453125, -2.0382080078125, -1.886962890625, -1.7357177734375, -1.58447265625, -1.4332275390625, -1.281982421875, -1.1307373046875, -0.9794921875, -0.8282470703125, -0.677001953125, -0.5257568359375, -0.37451171875, -0.2232666015625, -0.072021484375, 0.0792236328125, 0.23046875, 0.3817138671875, 0.532958984375, 0.6842041015625, 0.83544921875, 0.9866943359375, 1.137939453125, 1.2891845703125, 1.4404296875, 1.5916748046875, 1.742919921875, 1.8941650390625, 2.04541015625, 2.1966552734375, 2.347900390625, 2.4991455078125, 2.650390625, 2.8016357421875, 2.952880859375, 3.1041259765625, 3.25537109375, 3.4066162109375, 3.557861328125, 3.7091064453125, 3.8603515625, 4.0115966796875, 4.162841796875, 4.3140869140625, 4.46533203125, 4.6165771484375, 4.767822265625, 4.9190673828125, 5.0703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 3.0, 7.0, 6.0, 9.0, 9.0, 12.0, 10.0, 16.0, 13.0, 13.0, 25.0, 19.0, 20.0, 20.0, 22.0, 29.0, 26.0, 33.0, 34.0, 51.0, 33.0, 29.0, 45.0, 37.0, 43.0, 38.0, 33.0, 42.0, 38.0, 39.0, 23.0, 19.0, 26.0, 23.0, 26.0, 28.0, 9.0, 14.0, 14.0, 12.0, 12.0, 9.0, 4.0, 9.0, 7.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.046875, -8.768310546875, -8.48974609375, -8.211181640625, -7.9326171875, -7.654052734375, -7.37548828125, -7.096923828125, -6.818359375, -6.539794921875, -6.26123046875, -5.982666015625, -5.7041015625, -5.425537109375, -5.14697265625, -4.868408203125, -4.58984375, -4.311279296875, -4.03271484375, -3.754150390625, -3.4755859375, -3.197021484375, -2.91845703125, -2.639892578125, -2.361328125, -2.082763671875, -1.80419921875, -1.525634765625, -1.2470703125, -0.968505859375, -0.68994140625, -0.411376953125, -0.1328125, 0.145751953125, 0.42431640625, 0.702880859375, 0.9814453125, 1.260009765625, 1.53857421875, 1.817138671875, 2.095703125, 2.374267578125, 2.65283203125, 2.931396484375, 3.2099609375, 3.488525390625, 3.76708984375, 4.045654296875, 4.32421875, 4.602783203125, 4.88134765625, 5.159912109375, 5.4384765625, 5.717041015625, 5.99560546875, 6.274169921875, 6.552734375, 6.831298828125, 7.10986328125, 7.388427734375, 7.6669921875, 7.945556640625, 8.22412109375, 8.502685546875, 8.78125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 12.0, 9.0, 13.0, 42.0, 47.0, 90.0, 138.0, 288.0, 633.0, 1660.0, 5198.0, 22008.0, 181083.0, 734766.0, 83538.0, 13308.0, 3452.0, 1214.0, 509.0, 207.0, 116.0, 58.0, 47.0, 39.0, 20.0, 11.0, 5.0, 4.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8137664794921875, -1.759368896484375, -1.7049713134765625, -1.65057373046875, -1.5961761474609375, -1.541778564453125, -1.4873809814453125, -1.4329833984375, -1.3785858154296875, -1.324188232421875, -1.2697906494140625, -1.21539306640625, -1.1609954833984375, -1.106597900390625, -1.0522003173828125, -0.997802734375, -0.9434051513671875, -0.889007568359375, -0.8346099853515625, -0.78021240234375, -0.7258148193359375, -0.671417236328125, -0.6170196533203125, -0.5626220703125, -0.5082244873046875, -0.453826904296875, -0.3994293212890625, -0.34503173828125, -0.2906341552734375, -0.236236572265625, -0.1818389892578125, -0.12744140625, -0.0730438232421875, -0.018646240234375, 0.0357513427734375, 0.09014892578125, 0.1445465087890625, 0.198944091796875, 0.2533416748046875, 0.3077392578125, 0.3621368408203125, 0.416534423828125, 0.4709320068359375, 0.52532958984375, 0.5797271728515625, 0.634124755859375, 0.6885223388671875, 0.742919921875, 0.7973175048828125, 0.851715087890625, 0.9061126708984375, 0.96051025390625, 1.0149078369140625, 1.069305419921875, 1.1237030029296875, 1.1781005859375, 1.2324981689453125, 1.286895751953125, 1.3412933349609375, 1.39569091796875, 1.4500885009765625, 1.504486083984375, 1.5588836669921875, 1.61328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 10.0, 10.0, 10.0, 20.0, 24.0, 54.0, 52.0, 68.0, 78.0, 134.0, 121.0, 107.0, 86.0, 43.0, 34.0, 23.0, 26.0, 14.0, 14.0, 14.0, 11.0, 5.0, 2.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00021791458129882812, -0.00021111778914928436, -0.0002043209969997406, -0.00019752420485019684, -0.00019072741270065308, -0.00018393062055110931, -0.00017713382840156555, -0.0001703370362520218, -0.00016354024410247803, -0.00015674345195293427, -0.0001499466598033905, -0.00014314986765384674, -0.00013635307550430298, -0.00012955628335475922, -0.00012275949120521545, -0.00011596269905567169, -0.00010916590690612793, -0.00010236911475658417, -9.55723226070404e-05, -8.877553045749664e-05, -8.197873830795288e-05, -7.518194615840912e-05, -6.838515400886536e-05, -6.15883618593216e-05, -5.479156970977783e-05, -4.799477756023407e-05, -4.119798541069031e-05, -3.4401193261146545e-05, -2.7604401111602783e-05, -2.080760896205902e-05, -1.4010816812515259e-05, -7.214024662971497e-06, -4.172325134277344e-07, 6.379559636116028e-06, 1.317635178565979e-05, 1.9973143935203552e-05, 2.6769936084747314e-05, 3.356672823429108e-05, 4.036352038383484e-05, 4.71603125333786e-05, 5.395710468292236e-05, 6.0753896832466125e-05, 6.755068898200989e-05, 7.434748113155365e-05, 8.114427328109741e-05, 8.794106543064117e-05, 9.473785758018494e-05, 0.0001015346497297287, 0.00010833144187927246, 0.00011512823402881622, 0.00012192502617835999, 0.00012872181832790375, 0.0001355186104774475, 0.00014231540262699127, 0.00014911219477653503, 0.0001559089869260788, 0.00016270577907562256, 0.00016950257122516632, 0.00017629936337471008, 0.00018309615552425385, 0.0001898929476737976, 0.00019668973982334137, 0.00020348653197288513, 0.0002102833241224289, 0.00021708011627197266]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 7.0, 15.0, 21.0, 12.0, 26.0, 56.0, 112.0, 202.0, 388.0, 828.0, 2201.0, 6532.0, 27012.0, 200285.0, 699816.0, 88072.0, 15625.0, 4411.0, 1552.0, 641.0, 329.0, 169.0, 90.0, 46.0, 32.0, 31.0, 14.0, 8.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8837890625, -1.8289031982421875, -1.774017333984375, -1.7191314697265625, -1.66424560546875, -1.6093597412109375, -1.554473876953125, -1.4995880126953125, -1.4447021484375, -1.3898162841796875, -1.334930419921875, -1.2800445556640625, -1.22515869140625, -1.1702728271484375, -1.115386962890625, -1.0605010986328125, -1.005615234375, -0.9507293701171875, -0.895843505859375, -0.8409576416015625, -0.78607177734375, -0.7311859130859375, -0.676300048828125, -0.6214141845703125, -0.5665283203125, -0.5116424560546875, -0.456756591796875, -0.4018707275390625, -0.34698486328125, -0.2920989990234375, -0.237213134765625, -0.1823272705078125, -0.12744140625, -0.0725555419921875, -0.017669677734375, 0.0372161865234375, 0.09210205078125, 0.1469879150390625, 0.201873779296875, 0.2567596435546875, 0.3116455078125, 0.3665313720703125, 0.421417236328125, 0.4763031005859375, 0.53118896484375, 0.5860748291015625, 0.640960693359375, 0.6958465576171875, 0.750732421875, 0.8056182861328125, 0.860504150390625, 0.9153900146484375, 0.97027587890625, 1.0251617431640625, 1.080047607421875, 1.1349334716796875, 1.1898193359375, 1.2447052001953125, 1.299591064453125, 1.3544769287109375, 1.40936279296875, 1.4642486572265625, 1.519134521484375, 1.5740203857421875, 1.62890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 16.0, 19.0, 37.0, 52.0, 56.0, 106.0, 143.0, 165.0, 107.0, 64.0, 61.0, 37.0, 31.0, 25.0, 11.0, 9.0, 4.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.822265625, -0.791015625, -0.759765625, -0.728515625, -0.697265625, -0.666015625, -0.634765625, -0.603515625, -0.572265625, -0.541015625, -0.509765625, -0.478515625, -0.447265625, -0.416015625, -0.384765625, -0.353515625, -0.322265625, -0.291015625, -0.259765625, -0.228515625, -0.197265625, -0.166015625, -0.134765625, -0.103515625, -0.072265625, -0.041015625, -0.009765625, 0.021484375, 0.052734375, 0.083984375, 0.115234375, 0.146484375, 0.177734375, 0.208984375, 0.240234375, 0.271484375, 0.302734375, 0.333984375, 0.365234375, 0.396484375, 0.427734375, 0.458984375, 0.490234375, 0.521484375, 0.552734375, 0.583984375, 0.615234375, 0.646484375, 0.677734375, 0.708984375, 0.740234375, 0.771484375, 0.802734375, 0.833984375, 0.865234375, 0.896484375, 0.927734375, 0.958984375, 0.990234375, 1.021484375, 1.052734375, 1.083984375, 1.115234375, 1.146484375, 1.177734375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 48.0, 177.0, 395.0, 289.0, 66.0, 21.0, 8.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.83898162841797, -38.08824920654297, -36.33751678466797, -34.5867805480957, -32.8360481262207, -31.085315704345703, -29.33458137512207, -27.583847045898438, -25.833114624023438, -24.082382202148438, -22.331647872924805, -20.580913543701172, -18.830181121826172, -17.079448699951172, -15.328714370727539, -13.577980995178223, -11.827247619628906, -10.07651424407959, -8.325780868530273, -6.575047492980957, -4.824314117431641, -3.073580741882324, -1.3228473663330078, 0.4278860092163086, 2.178619384765625, 3.9293527603149414, 5.680086135864258, 7.430819511413574, 9.18155288696289, 10.932286262512207, 12.683019638061523, 14.43375301361084, 16.184486389160156, 17.935218811035156, 19.68595314025879, 21.436687469482422, 23.187419891357422, 24.938152313232422, 26.688886642456055, 28.439620971679688, 30.190353393554688, 31.941085815429688, 33.69181823730469, 35.44255447387695, 37.19328689575195, 38.94401931762695, 40.69475555419922, 42.44548797607422, 44.19622039794922, 45.94695281982422, 47.69768524169922, 49.448421478271484, 51.199153900146484, 52.949886322021484, 54.70062255859375, 56.45135498046875, 58.20208740234375, 59.95281982421875, 61.70355224609375, 63.454288482666016, 65.20501708984375, 66.95575714111328, 68.70648956298828, 70.45722198486328, 72.20795440673828]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 12.0, 7.0, 13.0, 19.0, 12.0, 16.0, 25.0, 20.0, 23.0, 31.0, 31.0, 41.0, 37.0, 50.0, 45.0, 42.0, 55.0, 48.0, 34.0, 52.0, 41.0, 50.0, 38.0, 34.0, 44.0, 28.0, 28.0, 17.0, 19.0, 21.0, 14.0, 8.0, 11.0, 11.0, 6.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.167110443115234, -16.581321716308594, -15.99553108215332, -15.40974235534668, -14.823952674865723, -14.238162994384766, -13.652373313903809, -13.066583633422852, -12.480794906616211, -11.895005226135254, -11.309215545654297, -10.723426818847656, -10.1376371383667, -9.551847457885742, -8.966057777404785, -8.380268096923828, -7.794478416442871, -7.208688735961914, -6.622899532318115, -6.037109851837158, -5.451320648193359, -4.865530967712402, -4.279741287231445, -3.6939520835876465, -3.1081624031066895, -2.5223729610443115, -1.936583399772644, -1.3507938385009766, -0.7650043964385986, -0.1792149543762207, 0.40657472610473633, 0.9923639297485352, 1.5781536102294922, 2.16394305229187, 2.749732494354248, 3.335522174835205, 3.921311616897583, 4.507101058959961, 5.092890739440918, 5.678679943084717, 6.264469623565674, 6.850259304046631, 7.43604850769043, 8.021838188171387, 8.607627868652344, 9.193416595458984, 9.779207229614258, 10.364995956420898, 10.950785636901855, 11.536575317382812, 12.12236499786377, 12.708154678344727, 13.293943405151367, 13.879733085632324, 14.465522766113281, 15.051311492919922, 15.637102127075195, 16.222890853881836, 16.80868148803711, 17.39447021484375, 17.980260848999023, 18.566049575805664, 19.151840209960938, 19.737628936767578, 20.32341766357422]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 2.0, 4.0, 7.0, 9.0, 13.0, 19.0, 22.0, 40.0, 63.0, 96.0, 156.0, 249.0, 416.0, 582.0, 1087.0, 2149.0, 4541.0, 10570.0, 32650.0, 149573.0, 1326510.0, 2315506.0, 275737.0, 48533.0, 14387.0, 5622.0, 2582.0, 1223.0, 731.0, 440.0, 278.0, 145.0, 113.0, 67.0, 52.0, 36.0, 24.0, 12.0, 14.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6640625, -5.4388427734375, -5.213623046875, -4.9884033203125, -4.76318359375, -4.5379638671875, -4.312744140625, -4.0875244140625, -3.8623046875, -3.6370849609375, -3.411865234375, -3.1866455078125, -2.96142578125, -2.7362060546875, -2.510986328125, -2.2857666015625, -2.060546875, -1.8353271484375, -1.610107421875, -1.3848876953125, -1.15966796875, -0.9344482421875, -0.709228515625, -0.4840087890625, -0.2587890625, -0.0335693359375, 0.191650390625, 0.4168701171875, 0.64208984375, 0.8673095703125, 1.092529296875, 1.3177490234375, 1.54296875, 1.7681884765625, 1.993408203125, 2.2186279296875, 2.44384765625, 2.6690673828125, 2.894287109375, 3.1195068359375, 3.3447265625, 3.5699462890625, 3.795166015625, 4.0203857421875, 4.24560546875, 4.4708251953125, 4.696044921875, 4.9212646484375, 5.146484375, 5.3717041015625, 5.596923828125, 5.8221435546875, 6.04736328125, 6.2725830078125, 6.497802734375, 6.7230224609375, 6.9482421875, 7.1734619140625, 7.398681640625, 7.6239013671875, 7.84912109375, 8.0743408203125, 8.299560546875, 8.5247802734375, 8.75]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 4.0, 11.0, 3.0, 14.0, 24.0, 19.0, 29.0, 43.0, 53.0, 58.0, 82.0, 70.0, 82.0, 85.0, 73.0, 78.0, 50.0, 59.0, 47.0, 21.0, 31.0, 19.0, 10.0, 12.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.13702392578125, -7.8990478515625, -7.66107177734375, -7.423095703125, -7.18511962890625, -6.9471435546875, -6.70916748046875, -6.47119140625, -6.23321533203125, -5.9952392578125, -5.75726318359375, -5.519287109375, -5.28131103515625, -5.0433349609375, -4.80535888671875, -4.5673828125, -4.32940673828125, -4.0914306640625, -3.85345458984375, -3.615478515625, -3.37750244140625, -3.1395263671875, -2.90155029296875, -2.66357421875, -2.42559814453125, -2.1876220703125, -1.94964599609375, -1.711669921875, -1.47369384765625, -1.2357177734375, -0.99774169921875, -0.759765625, -0.52178955078125, -0.2838134765625, -0.04583740234375, 0.192138671875, 0.43011474609375, 0.6680908203125, 0.90606689453125, 1.14404296875, 1.38201904296875, 1.6199951171875, 1.85797119140625, 2.095947265625, 2.33392333984375, 2.5718994140625, 2.80987548828125, 3.0478515625, 3.28582763671875, 3.5238037109375, 3.76177978515625, 3.999755859375, 4.23773193359375, 4.4757080078125, 4.71368408203125, 4.95166015625, 5.18963623046875, 5.4276123046875, 5.66558837890625, 5.903564453125, 6.14154052734375, 6.3795166015625, 6.61749267578125, 6.85546875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 9.0, 12.0, 14.0, 19.0, 23.0, 34.0, 42.0, 89.0, 112.0, 286.0, 581.0, 1468.0, 4606.0, 22773.0, 235000.0, 3626288.0, 270127.0, 24990.0, 5031.0, 1517.0, 568.0, 276.0, 159.0, 70.0, 56.0, 37.0, 22.0, 21.0, 9.0, 11.0, 9.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0], "bins": [-13.1015625, -12.79345703125, -12.4853515625, -12.17724609375, -11.869140625, -11.56103515625, -11.2529296875, -10.94482421875, -10.63671875, -10.32861328125, -10.0205078125, -9.71240234375, -9.404296875, -9.09619140625, -8.7880859375, -8.47998046875, -8.171875, -7.86376953125, -7.5556640625, -7.24755859375, -6.939453125, -6.63134765625, -6.3232421875, -6.01513671875, -5.70703125, -5.39892578125, -5.0908203125, -4.78271484375, -4.474609375, -4.16650390625, -3.8583984375, -3.55029296875, -3.2421875, -2.93408203125, -2.6259765625, -2.31787109375, -2.009765625, -1.70166015625, -1.3935546875, -1.08544921875, -0.77734375, -0.46923828125, -0.1611328125, 0.14697265625, 0.455078125, 0.76318359375, 1.0712890625, 1.37939453125, 1.6875, 1.99560546875, 2.3037109375, 2.61181640625, 2.919921875, 3.22802734375, 3.5361328125, 3.84423828125, 4.15234375, 4.46044921875, 4.7685546875, 5.07666015625, 5.384765625, 5.69287109375, 6.0009765625, 6.30908203125, 6.6171875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 3.0, 7.0, 9.0, 16.0, 19.0, 29.0, 27.0, 50.0, 59.0, 92.0, 147.0, 249.0, 393.0, 591.0, 688.0, 580.0, 363.0, 247.0, 135.0, 113.0, 59.0, 59.0, 41.0, 25.0, 20.0, 11.0, 12.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.7808990478515625, -1.711212158203125, -1.6415252685546875, -1.57183837890625, -1.5021514892578125, -1.432464599609375, -1.3627777099609375, -1.2930908203125, -1.2234039306640625, -1.153717041015625, -1.0840301513671875, -1.01434326171875, -0.9446563720703125, -0.874969482421875, -0.8052825927734375, -0.735595703125, -0.6659088134765625, -0.596221923828125, -0.5265350341796875, -0.45684814453125, -0.3871612548828125, -0.317474365234375, -0.2477874755859375, -0.1781005859375, -0.1084136962890625, -0.038726806640625, 0.0309600830078125, 0.10064697265625, 0.1703338623046875, 0.240020751953125, 0.3097076416015625, 0.37939453125, 0.4490814208984375, 0.518768310546875, 0.5884552001953125, 0.65814208984375, 0.7278289794921875, 0.797515869140625, 0.8672027587890625, 0.9368896484375, 1.0065765380859375, 1.076263427734375, 1.1459503173828125, 1.21563720703125, 1.2853240966796875, 1.355010986328125, 1.4246978759765625, 1.494384765625, 1.5640716552734375, 1.633758544921875, 1.7034454345703125, 1.77313232421875, 1.8428192138671875, 1.912506103515625, 1.9821929931640625, 2.0518798828125, 2.1215667724609375, 2.191253662109375, 2.2609405517578125, 2.33062744140625, 2.4003143310546875, 2.470001220703125, 2.5396881103515625, 2.609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 9.0, 14.0, 23.0, 31.0, 95.0, 147.0, 196.0, 217.0, 129.0, 74.0, 26.0, 21.0, 12.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.957261085510254, -6.37431001663208, -5.7913594245910645, -5.208408355712891, -4.625457763671875, -4.042506694793701, -3.4595556259155273, -2.8766050338745117, -2.293653964996338, -1.7107031345367432, -1.1277521848678589, -0.5448012351989746, 0.03814959526062012, 0.6211004257202148, 1.2040514945983887, 1.7870020866394043, 2.369953155517578, 2.952903985977173, 3.5358548164367676, 4.118805885314941, 4.701756477355957, 5.284707546234131, 5.867658615112305, 6.45060920715332, 7.033560276031494, 7.616511344909668, 8.199461936950684, 8.782413482666016, 9.365364074707031, 9.948314666748047, 10.531265258789062, 11.114215850830078, 11.697168350219727, 12.280118942260742, 12.863070487976074, 13.44602108001709, 14.028971672058105, 14.611923217773438, 15.194873809814453, 15.777824401855469, 16.360774993896484, 16.9437255859375, 17.526676177978516, 18.10962677001953, 18.69257926940918, 19.275529861450195, 19.85848045349121, 20.441431045532227, 21.024383544921875, 21.60733413696289, 22.190284729003906, 22.773235321044922, 23.35618782043457, 23.939138412475586, 24.5220890045166, 25.105039596557617, 25.687990188598633, 26.27094078063965, 26.853891372680664, 27.436843872070312, 28.019794464111328, 28.602745056152344, 29.18569564819336, 29.768646240234375, 30.35159683227539]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 17.0, 28.0, 20.0, 41.0, 47.0, 55.0, 66.0, 79.0, 86.0, 82.0, 69.0, 76.0, 57.0, 58.0, 45.0, 32.0, 37.0, 19.0, 18.0, 14.0, 9.0, 11.0, 8.0, 0.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.815110206604004, -9.547473907470703, -9.279837608337402, -9.012201309204102, -8.744564056396484, -8.476927757263184, -8.209291458129883, -7.941655158996582, -7.674018859863281, -7.4063825607299805, -7.1387457847595215, -6.871109485626221, -6.60347318649292, -6.335836410522461, -6.06820011138916, -5.800563812255859, -5.5329270362854, -5.2652907371521, -4.997653961181641, -4.73001766204834, -4.462381362915039, -4.194745063781738, -3.9271082878112793, -3.6594719886779785, -3.3918354511260986, -3.1241989135742188, -2.856562614440918, -2.588926076889038, -2.321289539337158, -2.0536532402038574, -1.7860167026519775, -1.5183802843093872, -1.2507438659667969, -0.9831074476242065, -0.7154709696769714, -0.44783449172973633, -0.180198073387146, 0.08743834495544434, 0.3550748825073242, 0.6227113008499146, 0.8903477191925049, 1.1579841375350952, 1.4256205558776855, 1.6932570934295654, 1.9608935117721558, 2.228529930114746, 2.496166467666626, 2.763803005218506, 3.0314393043518066, 3.2990758419036865, 3.5667121410369873, 3.834348678588867, 4.101984977722168, 4.369621276855469, 4.637258052825928, 4.9048943519592285, 5.1725311279296875, 5.440167427062988, 5.707804203033447, 5.975440502166748, 6.243076801300049, 6.510713577270508, 6.778349876403809, 7.045986175537109, 7.31362247467041]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 14.0, 17.0, 26.0, 35.0, 76.0, 149.0, 317.0, 612.0, 1350.0, 3429.0, 9776.0, 33207.0, 153376.0, 555861.0, 225012.0, 45063.0, 12692.0, 4380.0, 1703.0, 745.0, 320.0, 141.0, 94.0, 49.0, 34.0, 22.0, 8.0, 10.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9298858642578125, -1.872467041015625, -1.8150482177734375, -1.75762939453125, -1.7002105712890625, -1.642791748046875, -1.5853729248046875, -1.5279541015625, -1.4705352783203125, -1.413116455078125, -1.3556976318359375, -1.29827880859375, -1.2408599853515625, -1.183441162109375, -1.1260223388671875, -1.068603515625, -1.0111846923828125, -0.953765869140625, -0.8963470458984375, -0.83892822265625, -0.7815093994140625, -0.724090576171875, -0.6666717529296875, -0.6092529296875, -0.5518341064453125, -0.494415283203125, -0.4369964599609375, -0.37957763671875, -0.3221588134765625, -0.264739990234375, -0.2073211669921875, -0.14990234375, -0.0924835205078125, -0.035064697265625, 0.0223541259765625, 0.07977294921875, 0.1371917724609375, 0.194610595703125, 0.2520294189453125, 0.3094482421875, 0.3668670654296875, 0.424285888671875, 0.4817047119140625, 0.53912353515625, 0.5965423583984375, 0.653961181640625, 0.7113800048828125, 0.768798828125, 0.8262176513671875, 0.883636474609375, 0.9410552978515625, 0.99847412109375, 1.0558929443359375, 1.113311767578125, 1.1707305908203125, 1.2281494140625, 1.2855682373046875, 1.342987060546875, 1.4004058837890625, 1.45782470703125, 1.5152435302734375, 1.572662353515625, 1.6300811767578125, 1.6875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 7.0, 5.0, 7.0, 8.0, 16.0, 22.0, 28.0, 38.0, 40.0, 59.0, 73.0, 82.0, 78.0, 73.0, 71.0, 83.0, 58.0, 62.0, 46.0, 26.0, 27.0, 19.0, 19.0, 14.0, 8.0, 12.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.83203125, -5.6678466796875, -5.503662109375, -5.3394775390625, -5.17529296875, -5.0111083984375, -4.846923828125, -4.6827392578125, -4.5185546875, -4.3543701171875, -4.190185546875, -4.0260009765625, -3.86181640625, -3.6976318359375, -3.533447265625, -3.3692626953125, -3.205078125, -3.0408935546875, -2.876708984375, -2.7125244140625, -2.54833984375, -2.3841552734375, -2.219970703125, -2.0557861328125, -1.8916015625, -1.7274169921875, -1.563232421875, -1.3990478515625, -1.23486328125, -1.0706787109375, -0.906494140625, -0.7423095703125, -0.578125, -0.4139404296875, -0.249755859375, -0.0855712890625, 0.07861328125, 0.2427978515625, 0.406982421875, 0.5711669921875, 0.7353515625, 0.8995361328125, 1.063720703125, 1.2279052734375, 1.39208984375, 1.5562744140625, 1.720458984375, 1.8846435546875, 2.048828125, 2.2130126953125, 2.377197265625, 2.5413818359375, 2.70556640625, 2.8697509765625, 3.033935546875, 3.1981201171875, 3.3623046875, 3.5264892578125, 3.690673828125, 3.8548583984375, 4.01904296875, 4.1832275390625, 4.347412109375, 4.5115966796875, 4.67578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 13.0, 12.0, 14.0, 23.0, 14.0, 48.0, 51.0, 92.0, 95.0, 179.0, 275.0, 474.0, 815.0, 1487.0, 2906.0, 6127.0, 14327.0, 36377.0, 109493.0, 342788.0, 353051.0, 114361.0, 37917.0, 14656.0, 6304.0, 2960.0, 1518.0, 815.0, 506.0, 303.0, 176.0, 101.0, 70.0, 50.0, 34.0, 25.0, 27.0, 13.0, 8.0, 6.0, 13.0, 7.0, 4.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2919921875, -1.2528533935546875, -1.213714599609375, -1.1745758056640625, -1.13543701171875, -1.0962982177734375, -1.057159423828125, -1.0180206298828125, -0.9788818359375, -0.9397430419921875, -0.900604248046875, -0.8614654541015625, -0.82232666015625, -0.7831878662109375, -0.744049072265625, -0.7049102783203125, -0.665771484375, -0.6266326904296875, -0.587493896484375, -0.5483551025390625, -0.50921630859375, -0.4700775146484375, -0.430938720703125, -0.3917999267578125, -0.3526611328125, -0.3135223388671875, -0.274383544921875, -0.2352447509765625, -0.19610595703125, -0.1569671630859375, -0.117828369140625, -0.0786895751953125, -0.03955078125, -0.0004119873046875, 0.038726806640625, 0.0778656005859375, 0.11700439453125, 0.1561431884765625, 0.195281982421875, 0.2344207763671875, 0.2735595703125, 0.3126983642578125, 0.351837158203125, 0.3909759521484375, 0.43011474609375, 0.4692535400390625, 0.508392333984375, 0.5475311279296875, 0.586669921875, 0.6258087158203125, 0.664947509765625, 0.7040863037109375, 0.74322509765625, 0.7823638916015625, 0.821502685546875, 0.8606414794921875, 0.8997802734375, 0.9389190673828125, 0.978057861328125, 1.0171966552734375, 1.05633544921875, 1.0954742431640625, 1.134613037109375, 1.1737518310546875, 1.212890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 8.0, 8.0, 10.0, 16.0, 23.0, 20.0, 19.0, 29.0, 40.0, 27.0, 19.0, 35.0, 43.0, 50.0, 58.0, 53.0, 54.0, 48.0, 51.0, 34.0, 53.0, 43.0, 32.0, 32.0, 27.0, 33.0, 29.0, 14.0, 21.0, 11.0, 7.0, 10.0, 3.0, 13.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.2421875, -7.0162353515625, -6.790283203125, -6.5643310546875, -6.33837890625, -6.1124267578125, -5.886474609375, -5.6605224609375, -5.4345703125, -5.2086181640625, -4.982666015625, -4.7567138671875, -4.53076171875, -4.3048095703125, -4.078857421875, -3.8529052734375, -3.626953125, -3.4010009765625, -3.175048828125, -2.9490966796875, -2.72314453125, -2.4971923828125, -2.271240234375, -2.0452880859375, -1.8193359375, -1.5933837890625, -1.367431640625, -1.1414794921875, -0.91552734375, -0.6895751953125, -0.463623046875, -0.2376708984375, -0.01171875, 0.2142333984375, 0.440185546875, 0.6661376953125, 0.89208984375, 1.1180419921875, 1.343994140625, 1.5699462890625, 1.7958984375, 2.0218505859375, 2.247802734375, 2.4737548828125, 2.69970703125, 2.9256591796875, 3.151611328125, 3.3775634765625, 3.603515625, 3.8294677734375, 4.055419921875, 4.2813720703125, 4.50732421875, 4.7332763671875, 4.959228515625, 5.1851806640625, 5.4111328125, 5.6370849609375, 5.863037109375, 6.0889892578125, 6.31494140625, 6.5408935546875, 6.766845703125, 6.9927978515625, 7.21875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 8.0, 13.0, 20.0, 19.0, 32.0, 49.0, 64.0, 85.0, 138.0, 254.0, 426.0, 922.0, 2030.0, 4959.0, 14855.0, 55744.0, 275244.0, 534131.0, 117098.0, 28111.0, 8440.0, 3082.0, 1279.0, 633.0, 355.0, 156.0, 110.0, 86.0, 57.0, 35.0, 22.0, 23.0, 15.0, 4.0, 7.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.69970703125, -0.6773147583007812, -0.6549224853515625, -0.6325302124023438, -0.610137939453125, -0.5877456665039062, -0.5653533935546875, -0.5429611206054688, -0.52056884765625, -0.49817657470703125, -0.4757843017578125, -0.45339202880859375, -0.430999755859375, -0.40860748291015625, -0.3862152099609375, -0.36382293701171875, -0.3414306640625, -0.31903839111328125, -0.2966461181640625, -0.27425384521484375, -0.251861572265625, -0.22946929931640625, -0.2070770263671875, -0.18468475341796875, -0.16229248046875, -0.13990020751953125, -0.1175079345703125, -0.09511566162109375, -0.072723388671875, -0.05033111572265625, -0.0279388427734375, -0.00554656982421875, 0.016845703125, 0.03923797607421875, 0.0616302490234375, 0.08402252197265625, 0.106414794921875, 0.12880706787109375, 0.1511993408203125, 0.17359161376953125, 0.19598388671875, 0.21837615966796875, 0.2407684326171875, 0.26316070556640625, 0.285552978515625, 0.30794525146484375, 0.3303375244140625, 0.35272979736328125, 0.3751220703125, 0.39751434326171875, 0.4199066162109375, 0.44229888916015625, 0.464691162109375, 0.48708343505859375, 0.5094757080078125, 0.5318679809570312, 0.55426025390625, 0.5766525268554688, 0.5990447998046875, 0.6214370727539062, 0.643829345703125, 0.6662216186523438, 0.6886138916015625, 0.7110061645507812, 0.7333984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 9.0, 11.0, 9.0, 15.0, 16.0, 19.0, 29.0, 31.0, 43.0, 71.0, 91.0, 89.0, 114.0, 93.0, 78.0, 70.0, 60.0, 45.0, 27.0, 11.0, 20.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002536773681640625, -0.00024364516139030457, -0.00023361295461654663, -0.0002235807478427887, -0.00021354854106903076, -0.00020351633429527283, -0.0001934841275215149, -0.00018345192074775696, -0.00017341971397399902, -0.0001633875072002411, -0.00015335530042648315, -0.00014332309365272522, -0.00013329088687896729, -0.00012325868010520935, -0.00011322647333145142, -0.00010319426655769348, -9.316205978393555e-05, -8.312985301017761e-05, -7.309764623641968e-05, -6.306543946266174e-05, -5.303323268890381e-05, -4.3001025915145874e-05, -3.296881914138794e-05, -2.2936612367630005e-05, -1.290440559387207e-05, -2.8721988201141357e-06, 7.160007953643799e-06, 1.7192214727401733e-05, 2.7224421501159668e-05, 3.72566282749176e-05, 4.728883504867554e-05, 5.732104182243347e-05, 6.73532485961914e-05, 7.738545536994934e-05, 8.741766214370728e-05, 9.744986891746521e-05, 0.00010748207569122314, 0.00011751428246498108, 0.00012754648923873901, 0.00013757869601249695, 0.00014761090278625488, 0.00015764310956001282, 0.00016767531633377075, 0.0001777075231075287, 0.00018773972988128662, 0.00019777193665504456, 0.0002078041434288025, 0.00021783635020256042, 0.00022786855697631836, 0.0002379007637500763, 0.00024793297052383423, 0.00025796517729759216, 0.0002679973840713501, 0.00027802959084510803, 0.00028806179761886597, 0.0002980940043926239, 0.00030812621116638184, 0.00031815841794013977, 0.0003281906247138977, 0.00033822283148765564, 0.0003482550382614136, 0.0003582872450351715, 0.00036831945180892944, 0.0003783516585826874, 0.0003883838653564453]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 13.0, 10.0, 7.0, 10.0, 17.0, 22.0, 25.0, 60.0, 88.0, 107.0, 199.0, 377.0, 735.0, 1535.0, 3965.0, 11700.0, 41051.0, 172096.0, 537301.0, 209036.0, 48591.0, 13495.0, 4530.0, 1746.0, 779.0, 388.0, 256.0, 153.0, 90.0, 48.0, 30.0, 15.0, 15.0, 14.0, 6.0, 5.0, 6.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.69482421875, -0.6747207641601562, -0.6546173095703125, -0.6345138549804688, -0.614410400390625, -0.5943069458007812, -0.5742034912109375, -0.5541000366210938, -0.53399658203125, -0.5138931274414062, -0.4937896728515625, -0.47368621826171875, -0.453582763671875, -0.43347930908203125, -0.4133758544921875, -0.39327239990234375, -0.3731689453125, -0.35306549072265625, -0.3329620361328125, -0.31285858154296875, -0.292755126953125, -0.27265167236328125, -0.2525482177734375, -0.23244476318359375, -0.21234130859375, -0.19223785400390625, -0.1721343994140625, -0.15203094482421875, -0.131927490234375, -0.11182403564453125, -0.0917205810546875, -0.07161712646484375, -0.051513671875, -0.03141021728515625, -0.0113067626953125, 0.00879669189453125, 0.028900146484375, 0.04900360107421875, 0.0691070556640625, 0.08921051025390625, 0.10931396484375, 0.12941741943359375, 0.1495208740234375, 0.16962432861328125, 0.189727783203125, 0.20983123779296875, 0.2299346923828125, 0.25003814697265625, 0.2701416015625, 0.29024505615234375, 0.3103485107421875, 0.33045196533203125, 0.350555419921875, 0.37065887451171875, 0.3907623291015625, 0.41086578369140625, 0.43096923828125, 0.45107269287109375, 0.4711761474609375, 0.49127960205078125, 0.511383056640625, 0.5314865112304688, 0.5515899658203125, 0.5716934204101562, 0.591796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 14.0, 12.0, 15.0, 17.0, 26.0, 30.0, 36.0, 31.0, 44.0, 51.0, 55.0, 80.0, 65.0, 90.0, 67.0, 57.0, 50.0, 43.0, 40.0, 27.0, 17.0, 20.0, 17.0, 15.0, 10.0, 10.0, 6.0, 4.0, 8.0, 7.0, 2.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13055419921875, -0.12646484375, -0.12237548828125, -0.1182861328125, -0.11419677734375, -0.110107421875, -0.10601806640625, -0.1019287109375, -0.09783935546875, -0.09375, -0.08966064453125, -0.0855712890625, -0.08148193359375, -0.077392578125, -0.07330322265625, -0.0692138671875, -0.06512451171875, -0.06103515625, -0.05694580078125, -0.0528564453125, -0.04876708984375, -0.044677734375, -0.04058837890625, -0.0364990234375, -0.03240966796875, -0.0283203125, -0.02423095703125, -0.0201416015625, -0.01605224609375, -0.011962890625, -0.00787353515625, -0.0037841796875, 0.00030517578125, 0.00439453125, 0.00848388671875, 0.0125732421875, 0.01666259765625, 0.020751953125, 0.02484130859375, 0.0289306640625, 0.03302001953125, 0.037109375, 0.04119873046875, 0.0452880859375, 0.04937744140625, 0.053466796875, 0.05755615234375, 0.0616455078125, 0.06573486328125, 0.06982421875, 0.07391357421875, 0.0780029296875, 0.08209228515625, 0.086181640625, 0.09027099609375, 0.0943603515625, 0.09844970703125, 0.1025390625, 0.10662841796875, 0.1107177734375, 0.11480712890625, 0.118896484375, 0.12298583984375, 0.1270751953125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 15.0, 35.0, 107.0, 206.0, 305.0, 174.0, 88.0, 32.0, 17.0, 11.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.790182113647461, -5.328359127044678, -4.866536617279053, -4.4047136306762695, -3.9428911209106445, -3.4810681343078613, -3.0192453861236572, -2.557422637939453, -2.095599889755249, -1.633777141571045, -1.1719543933868408, -0.7101315259933472, -0.24830877780914307, 0.21351408958435059, 0.6753368377685547, 1.1371595859527588, 1.598982334136963, 2.060805082321167, 2.522627830505371, 2.9844508171081543, 3.4462733268737793, 3.9080963134765625, 4.3699188232421875, 4.831741809844971, 5.293564796447754, 5.755387783050537, 6.217210292816162, 6.679033279418945, 7.14085578918457, 7.6026787757873535, 8.064501762390137, 8.526324272155762, 8.988146781921387, 9.449969291687012, 9.911792755126953, 10.373615264892578, 10.835437774658203, 11.297260284423828, 11.75908374786377, 12.220906257629395, 12.68272876739502, 13.144551277160645, 13.606374740600586, 14.068197250366211, 14.530019760131836, 14.991842269897461, 15.453665733337402, 15.915488243103027, 16.37731170654297, 16.839134216308594, 17.30095672607422, 17.762779235839844, 18.2246036529541, 18.686426162719727, 19.14824867248535, 19.610071182250977, 20.0718936920166, 20.533716201782227, 20.99553871154785, 21.457361221313477, 21.919185638427734, 22.38100814819336, 22.842830657958984, 23.30465316772461, 23.766475677490234]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 8.0, 4.0, 14.0, 14.0, 26.0, 32.0, 42.0, 51.0, 49.0, 92.0, 92.0, 84.0, 93.0, 74.0, 70.0, 61.0, 45.0, 37.0, 28.0, 32.0, 17.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.942391872406006, -5.76731538772583, -5.592238426208496, -5.41716194152832, -5.2420854568481445, -5.067008972167969, -4.891932010650635, -4.716855525970459, -4.541778564453125, -4.366702079772949, -4.191625118255615, -4.0165486335754395, -3.8414721488952637, -3.666395425796509, -3.491318702697754, -3.316242218017578, -3.1411657333374023, -2.9660890102386475, -2.7910125255584717, -2.615935802459717, -2.440859317779541, -2.265782594680786, -2.0907058715820312, -1.915629267692566, -1.7405526638031006, -1.5654760599136353, -1.39039945602417, -1.215322732925415, -1.0402461290359497, -0.8651695251464844, -0.6900928020477295, -0.5150161981582642, -0.3399391174316406, -0.1648624837398529, 0.010214149951934814, 0.18529081344604492, 0.36036741733551025, 0.5354440212249756, 0.7105207443237305, 0.8855973482131958, 1.0606739521026611, 1.2357505559921265, 1.4108271598815918, 1.5859038829803467, 1.760980486869812, 1.9360570907592773, 2.1111338138580322, 2.286210536956787, 2.461287021636963, 2.6363637447357178, 2.8114402294158936, 2.9865169525146484, 3.161593437194824, 3.336670160293579, 3.511746883392334, 3.6868233680725098, 3.8619000911712646, 4.0369768142700195, 4.212053298950195, 4.387129783630371, 4.562206745147705, 4.737283229827881, 4.912360191345215, 5.087436676025391, 5.262513160705566]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 7.0, 4.0, 8.0, 8.0, 11.0, 32.0, 32.0, 53.0, 89.0, 147.0, 250.0, 425.0, 803.0, 1567.0, 3432.0, 8851.0, 29017.0, 147637.0, 629087.0, 176607.0, 33114.0, 9974.0, 3749.0, 1705.0, 864.0, 446.0, 251.0, 148.0, 90.0, 58.0, 27.0, 27.0, 18.0, 6.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6484375, -4.517669677734375, -4.38690185546875, -4.256134033203125, -4.1253662109375, -3.994598388671875, -3.86383056640625, -3.733062744140625, -3.602294921875, -3.471527099609375, -3.34075927734375, -3.209991455078125, -3.0792236328125, -2.948455810546875, -2.81768798828125, -2.686920166015625, -2.55615234375, -2.425384521484375, -2.29461669921875, -2.163848876953125, -2.0330810546875, -1.902313232421875, -1.77154541015625, -1.640777587890625, -1.510009765625, -1.379241943359375, -1.24847412109375, -1.117706298828125, -0.9869384765625, -0.856170654296875, -0.72540283203125, -0.594635009765625, -0.4638671875, -0.333099365234375, -0.20233154296875, -0.071563720703125, 0.0592041015625, 0.189971923828125, 0.32073974609375, 0.451507568359375, 0.582275390625, 0.713043212890625, 0.84381103515625, 0.974578857421875, 1.1053466796875, 1.236114501953125, 1.36688232421875, 1.497650146484375, 1.62841796875, 1.759185791015625, 1.88995361328125, 2.020721435546875, 2.1514892578125, 2.282257080078125, 2.41302490234375, 2.543792724609375, 2.674560546875, 2.805328369140625, 2.93609619140625, 3.066864013671875, 3.1976318359375, 3.328399658203125, 3.45916748046875, 3.589935302734375, 3.720703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 19.0, 20.0, 30.0, 41.0, 42.0, 62.0, 80.0, 80.0, 97.0, 99.0, 76.0, 70.0, 61.0, 43.0, 38.0, 29.0, 34.0, 24.0, 7.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.546875, -15.117919921875, -14.68896484375, -14.260009765625, -13.8310546875, -13.402099609375, -12.97314453125, -12.544189453125, -12.115234375, -11.686279296875, -11.25732421875, -10.828369140625, -10.3994140625, -9.970458984375, -9.54150390625, -9.112548828125, -8.68359375, -8.254638671875, -7.82568359375, -7.396728515625, -6.9677734375, -6.538818359375, -6.10986328125, -5.680908203125, -5.251953125, -4.822998046875, -4.39404296875, -3.965087890625, -3.5361328125, -3.107177734375, -2.67822265625, -2.249267578125, -1.8203125, -1.391357421875, -0.96240234375, -0.533447265625, -0.1044921875, 0.324462890625, 0.75341796875, 1.182373046875, 1.611328125, 2.040283203125, 2.46923828125, 2.898193359375, 3.3271484375, 3.756103515625, 4.18505859375, 4.614013671875, 5.04296875, 5.471923828125, 5.90087890625, 6.329833984375, 6.7587890625, 7.187744140625, 7.61669921875, 8.045654296875, 8.474609375, 8.903564453125, 9.33251953125, 9.761474609375, 10.1904296875, 10.619384765625, 11.04833984375, 11.477294921875, 11.90625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 10.0, 13.0, 24.0, 40.0, 33.0, 63.0, 68.0, 102.0, 117.0, 229.0, 459.0, 1027.0, 3240.0, 14592.0, 137748.0, 775267.0, 98878.0, 11794.0, 2783.0, 940.0, 418.0, 190.0, 134.0, 88.0, 66.0, 43.0, 46.0, 24.0, 28.0, 16.0, 13.0, 8.0, 6.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.484375, -5.32513427734375, -5.1658935546875, -5.00665283203125, -4.847412109375, -4.68817138671875, -4.5289306640625, -4.36968994140625, -4.21044921875, -4.05120849609375, -3.8919677734375, -3.73272705078125, -3.573486328125, -3.41424560546875, -3.2550048828125, -3.09576416015625, -2.9365234375, -2.77728271484375, -2.6180419921875, -2.45880126953125, -2.299560546875, -2.14031982421875, -1.9810791015625, -1.82183837890625, -1.66259765625, -1.50335693359375, -1.3441162109375, -1.18487548828125, -1.025634765625, -0.86639404296875, -0.7071533203125, -0.54791259765625, -0.388671875, -0.22943115234375, -0.0701904296875, 0.08905029296875, 0.248291015625, 0.40753173828125, 0.5667724609375, 0.72601318359375, 0.88525390625, 1.04449462890625, 1.2037353515625, 1.36297607421875, 1.522216796875, 1.68145751953125, 1.8406982421875, 1.99993896484375, 2.1591796875, 2.31842041015625, 2.4776611328125, 2.63690185546875, 2.796142578125, 2.95538330078125, 3.1146240234375, 3.27386474609375, 3.43310546875, 3.59234619140625, 3.7515869140625, 3.91082763671875, 4.070068359375, 4.22930908203125, 4.3885498046875, 4.54779052734375, 4.70703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 4.0, 3.0, 9.0, 10.0, 21.0, 25.0, 24.0, 20.0, 31.0, 38.0, 43.0, 40.0, 52.0, 57.0, 54.0, 51.0, 44.0, 70.0, 48.0, 39.0, 45.0, 51.0, 34.0, 32.0, 28.0, 24.0, 29.0, 13.0, 16.0, 12.0, 5.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.383544921875, -10.02490234375, -9.666259765625, -9.3076171875, -8.948974609375, -8.59033203125, -8.231689453125, -7.873046875, -7.514404296875, -7.15576171875, -6.797119140625, -6.4384765625, -6.079833984375, -5.72119140625, -5.362548828125, -5.00390625, -4.645263671875, -4.28662109375, -3.927978515625, -3.5693359375, -3.210693359375, -2.85205078125, -2.493408203125, -2.134765625, -1.776123046875, -1.41748046875, -1.058837890625, -0.7001953125, -0.341552734375, 0.01708984375, 0.375732421875, 0.734375, 1.093017578125, 1.45166015625, 1.810302734375, 2.1689453125, 2.527587890625, 2.88623046875, 3.244873046875, 3.603515625, 3.962158203125, 4.32080078125, 4.679443359375, 5.0380859375, 5.396728515625, 5.75537109375, 6.114013671875, 6.47265625, 6.831298828125, 7.18994140625, 7.548583984375, 7.9072265625, 8.265869140625, 8.62451171875, 8.983154296875, 9.341796875, 9.700439453125, 10.05908203125, 10.417724609375, 10.7763671875, 11.135009765625, 11.49365234375, 11.852294921875, 12.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 11.0, 5.0, 21.0, 20.0, 40.0, 54.0, 92.0, 132.0, 252.0, 503.0, 1041.0, 2455.0, 7247.0, 31399.0, 197328.0, 652133.0, 124641.0, 21541.0, 5567.0, 2023.0, 889.0, 461.0, 240.0, 137.0, 94.0, 63.0, 47.0, 16.0, 19.0, 17.0, 6.0, 8.0, 2.0, 3.0, 2.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1845703125, -1.1428375244140625, -1.101104736328125, -1.0593719482421875, -1.01763916015625, -0.9759063720703125, -0.934173583984375, -0.8924407958984375, -0.8507080078125, -0.8089752197265625, -0.767242431640625, -0.7255096435546875, -0.68377685546875, -0.6420440673828125, -0.600311279296875, -0.5585784912109375, -0.516845703125, -0.4751129150390625, -0.433380126953125, -0.3916473388671875, -0.34991455078125, -0.3081817626953125, -0.266448974609375, -0.2247161865234375, -0.1829833984375, -0.1412506103515625, -0.099517822265625, -0.0577850341796875, -0.01605224609375, 0.0256805419921875, 0.067413330078125, 0.1091461181640625, 0.15087890625, 0.1926116943359375, 0.234344482421875, 0.2760772705078125, 0.31781005859375, 0.3595428466796875, 0.401275634765625, 0.4430084228515625, 0.4847412109375, 0.5264739990234375, 0.568206787109375, 0.6099395751953125, 0.65167236328125, 0.6934051513671875, 0.735137939453125, 0.7768707275390625, 0.818603515625, 0.8603363037109375, 0.902069091796875, 0.9438018798828125, 0.98553466796875, 1.0272674560546875, 1.069000244140625, 1.1107330322265625, 1.1524658203125, 1.1941986083984375, 1.235931396484375, 1.2776641845703125, 1.31939697265625, 1.3611297607421875, 1.402862548828125, 1.4445953369140625, 1.486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 12.0, 12.0, 15.0, 14.0, 37.0, 39.0, 49.0, 66.0, 97.0, 117.0, 123.0, 88.0, 75.0, 59.0, 43.0, 38.0, 38.0, 13.0, 16.0, 10.0, 4.0, 5.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002123117446899414, -0.00020629167556762695, -0.0002002716064453125, -0.00019425153732299805, -0.0001882314682006836, -0.00018221139907836914, -0.0001761913299560547, -0.00017017126083374023, -0.00016415119171142578, -0.00015813112258911133, -0.00015211105346679688, -0.00014609098434448242, -0.00014007091522216797, -0.00013405084609985352, -0.00012803077697753906, -0.00012201070785522461, -0.00011599063873291016, -0.0001099705696105957, -0.00010395050048828125, -9.79304313659668e-05, -9.191036224365234e-05, -8.589029312133789e-05, -7.987022399902344e-05, -7.385015487670898e-05, -6.783008575439453e-05, -6.181001663208008e-05, -5.5789947509765625e-05, -4.976987838745117e-05, -4.374980926513672e-05, -3.7729740142822266e-05, -3.170967102050781e-05, -2.568960189819336e-05, -1.9669532775878906e-05, -1.3649463653564453e-05, -7.62939453125e-06, -1.6093254089355469e-06, 4.410743713378906e-06, 1.043081283569336e-05, 1.6450881958007812e-05, 2.2470951080322266e-05, 2.849102020263672e-05, 3.451108932495117e-05, 4.0531158447265625e-05, 4.655122756958008e-05, 5.257129669189453e-05, 5.8591365814208984e-05, 6.461143493652344e-05, 7.063150405883789e-05, 7.665157318115234e-05, 8.26716423034668e-05, 8.869171142578125e-05, 9.47117805480957e-05, 0.00010073184967041016, 0.00010675191879272461, 0.00011277198791503906, 0.00011879205703735352, 0.00012481212615966797, 0.00013083219528198242, 0.00013685226440429688, 0.00014287233352661133, 0.00014889240264892578, 0.00015491247177124023, 0.0001609325408935547, 0.00016695261001586914, 0.0001729726791381836]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 12.0, 25.0, 22.0, 36.0, 51.0, 67.0, 126.0, 191.0, 332.0, 604.0, 1243.0, 2655.0, 6156.0, 17062.0, 59246.0, 275438.0, 529469.0, 110626.0, 28248.0, 9400.0, 3878.0, 1743.0, 830.0, 402.0, 211.0, 146.0, 88.0, 62.0, 40.0, 29.0, 26.0, 14.0, 15.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.16015625, -1.1252288818359375, -1.090301513671875, -1.0553741455078125, -1.02044677734375, -0.9855194091796875, -0.950592041015625, -0.9156646728515625, -0.8807373046875, -0.8458099365234375, -0.810882568359375, -0.7759552001953125, -0.74102783203125, -0.7061004638671875, -0.671173095703125, -0.6362457275390625, -0.601318359375, -0.5663909912109375, -0.531463623046875, -0.4965362548828125, -0.46160888671875, -0.4266815185546875, -0.391754150390625, -0.3568267822265625, -0.3218994140625, -0.2869720458984375, -0.252044677734375, -0.2171173095703125, -0.18218994140625, -0.1472625732421875, -0.112335205078125, -0.0774078369140625, -0.04248046875, -0.0075531005859375, 0.027374267578125, 0.0623016357421875, 0.09722900390625, 0.1321563720703125, 0.167083740234375, 0.2020111083984375, 0.2369384765625, 0.2718658447265625, 0.306793212890625, 0.3417205810546875, 0.37664794921875, 0.4115753173828125, 0.446502685546875, 0.4814300537109375, 0.516357421875, 0.5512847900390625, 0.586212158203125, 0.6211395263671875, 0.65606689453125, 0.6909942626953125, 0.725921630859375, 0.7608489990234375, 0.7957763671875, 0.8307037353515625, 0.865631103515625, 0.9005584716796875, 0.93548583984375, 0.9704132080078125, 1.005340576171875, 1.0402679443359375, 1.0751953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 5.0, 3.0, 8.0, 10.0, 6.0, 11.0, 14.0, 12.0, 25.0, 33.0, 30.0, 35.0, 37.0, 49.0, 50.0, 77.0, 89.0, 90.0, 70.0, 68.0, 54.0, 31.0, 30.0, 24.0, 21.0, 17.0, 18.0, 20.0, 11.0, 7.0, 3.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.537109375, -0.5192642211914062, -0.5014190673828125, -0.48357391357421875, -0.465728759765625, -0.44788360595703125, -0.4300384521484375, -0.41219329833984375, -0.39434814453125, -0.37650299072265625, -0.3586578369140625, -0.34081268310546875, -0.322967529296875, -0.30512237548828125, -0.2872772216796875, -0.26943206787109375, -0.2515869140625, -0.23374176025390625, -0.2158966064453125, -0.19805145263671875, -0.180206298828125, -0.16236114501953125, -0.1445159912109375, -0.12667083740234375, -0.10882568359375, -0.09098052978515625, -0.0731353759765625, -0.05529022216796875, -0.037445068359375, -0.01959991455078125, -0.0017547607421875, 0.01609039306640625, 0.033935546875, 0.05178070068359375, 0.0696258544921875, 0.08747100830078125, 0.105316162109375, 0.12316131591796875, 0.1410064697265625, 0.15885162353515625, 0.17669677734375, 0.19454193115234375, 0.2123870849609375, 0.23023223876953125, 0.248077392578125, 0.26592254638671875, 0.2837677001953125, 0.30161285400390625, 0.3194580078125, 0.33730316162109375, 0.3551483154296875, 0.37299346923828125, 0.390838623046875, 0.40868377685546875, 0.4265289306640625, 0.44437408447265625, 0.46221923828125, 0.48006439208984375, 0.4979095458984375, 0.5157546997070312, 0.533599853515625, 0.5514450073242188, 0.5692901611328125, 0.5871353149414062, 0.60498046875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 36.0, 95.0, 299.0, 361.0, 134.0, 41.0, 18.0, 8.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.893125534057617, -22.651193618774414, -21.409259796142578, -20.167327880859375, -18.925395965576172, -17.68346405029297, -16.441532135009766, -15.19959831237793, -13.957666397094727, -12.715734481811523, -11.473801612854004, -10.231868743896484, -8.989936828613281, -7.74800443649292, -6.506072044372559, -5.264139175415039, -4.022207260131836, -2.7802748680114746, -1.5383424758911133, -0.29641008377075195, 0.9455223083496094, 2.1874547004699707, 3.429387092590332, 4.671319961547852, 5.913251876831055, 7.155184268951416, 8.397116661071777, 9.639049530029297, 10.8809814453125, 12.122913360595703, 13.364846229553223, 14.606779098510742, 15.848712921142578, 17.09064483642578, 18.332576751708984, 19.57451057434082, 20.816442489624023, 22.058374404907227, 23.300308227539062, 24.542240142822266, 25.78417205810547, 27.026103973388672, 28.268035888671875, 29.50996971130371, 30.751901626586914, 31.993833541870117, 33.23576736450195, 34.477699279785156, 35.71963119506836, 36.96156311035156, 38.203495025634766, 39.44542694091797, 40.68736267089844, 41.92929458618164, 43.171226501464844, 44.41315841674805, 45.65509033203125, 46.89702224731445, 48.138954162597656, 49.38088607788086, 50.62281799316406, 51.86475372314453, 53.106685638427734, 54.34861755371094, 55.59054946899414]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 9.0, 5.0, 10.0, 12.0, 11.0, 24.0, 20.0, 22.0, 17.0, 24.0, 33.0, 37.0, 30.0, 25.0, 36.0, 39.0, 40.0, 40.0, 45.0, 45.0, 40.0, 53.0, 46.0, 32.0, 29.0, 35.0, 24.0, 31.0, 28.0, 32.0, 24.0, 13.0, 13.0, 16.0, 13.0, 14.0, 8.0, 5.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0], "bins": [-18.27943992614746, -17.77526092529297, -17.271081924438477, -16.766902923583984, -16.26272201538086, -15.758543968200684, -15.254364013671875, -14.750185012817383, -14.24600601196289, -13.741827011108398, -13.237648010253906, -12.733468055725098, -12.229289054870605, -11.725110054016113, -11.220930099487305, -10.716751098632812, -10.21257209777832, -9.708393096923828, -9.204214096069336, -8.700034141540527, -8.195855140686035, -7.691676139831543, -7.187496662139893, -6.683317184448242, -6.17913818359375, -5.674959182739258, -5.170779705047607, -4.666600227355957, -4.162421226501465, -3.6582419872283936, -3.1540627479553223, -2.649883508682251, -2.145705223083496, -1.6415259838104248, -1.1373467445373535, -0.6331675052642822, -0.12898826599121094, 0.37519097328186035, 0.8793702125549316, 1.383549451828003, 1.8877286911010742, 2.3919079303741455, 2.896087169647217, 3.400266408920288, 3.9044456481933594, 4.408624649047852, 4.912804126739502, 5.416983604431152, 5.9211626052856445, 6.425341606140137, 6.929521083831787, 7.4337005615234375, 7.93787956237793, 8.442058563232422, 8.946237564086914, 9.450417518615723, 9.954596519470215, 10.458775520324707, 10.962955474853516, 11.467134475708008, 11.9713134765625, 12.475492477416992, 12.979671478271484, 13.483851432800293, 13.988030433654785]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 12.0, 21.0, 52.0, 77.0, 179.0, 385.0, 869.0, 2071.0, 5376.0, 18121.0, 108619.0, 1881463.0, 2035230.0, 114075.0, 18938.0, 5304.0, 1903.0, 811.0, 340.0, 184.0, 102.0, 52.0, 34.0, 18.0, 16.0, 6.0, 5.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0078125, -5.721923828125, -5.43603515625, -5.150146484375, -4.8642578125, -4.578369140625, -4.29248046875, -4.006591796875, -3.720703125, -3.434814453125, -3.14892578125, -2.863037109375, -2.5771484375, -2.291259765625, -2.00537109375, -1.719482421875, -1.43359375, -1.147705078125, -0.86181640625, -0.575927734375, -0.2900390625, -0.004150390625, 0.28173828125, 0.567626953125, 0.853515625, 1.139404296875, 1.42529296875, 1.711181640625, 1.9970703125, 2.282958984375, 2.56884765625, 2.854736328125, 3.140625, 3.426513671875, 3.71240234375, 3.998291015625, 4.2841796875, 4.570068359375, 4.85595703125, 5.141845703125, 5.427734375, 5.713623046875, 5.99951171875, 6.285400390625, 6.5712890625, 6.857177734375, 7.14306640625, 7.428955078125, 7.71484375, 8.000732421875, 8.28662109375, 8.572509765625, 8.8583984375, 9.144287109375, 9.43017578125, 9.716064453125, 10.001953125, 10.287841796875, 10.57373046875, 10.859619140625, 11.1455078125, 11.431396484375, 11.71728515625, 12.003173828125, 12.2890625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 5.0, 5.0, 14.0, 10.0, 17.0, 36.0, 46.0, 51.0, 78.0, 99.0, 104.0, 128.0, 87.0, 97.0, 56.0, 57.0, 44.0, 24.0, 13.0, 13.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1964111328125, -7.916259765625, -7.6361083984375, -7.35595703125, -7.0758056640625, -6.795654296875, -6.5155029296875, -6.2353515625, -5.9552001953125, -5.675048828125, -5.3948974609375, -5.11474609375, -4.8345947265625, -4.554443359375, -4.2742919921875, -3.994140625, -3.7139892578125, -3.433837890625, -3.1536865234375, -2.87353515625, -2.5933837890625, -2.313232421875, -2.0330810546875, -1.7529296875, -1.4727783203125, -1.192626953125, -0.9124755859375, -0.63232421875, -0.3521728515625, -0.072021484375, 0.2081298828125, 0.48828125, 0.7684326171875, 1.048583984375, 1.3287353515625, 1.60888671875, 1.8890380859375, 2.169189453125, 2.4493408203125, 2.7294921875, 3.0096435546875, 3.289794921875, 3.5699462890625, 3.85009765625, 4.1302490234375, 4.410400390625, 4.6905517578125, 4.970703125, 5.2508544921875, 5.531005859375, 5.8111572265625, 6.09130859375, 6.3714599609375, 6.651611328125, 6.9317626953125, 7.2119140625, 7.4920654296875, 7.772216796875, 8.0523681640625, 8.33251953125, 8.6126708984375, 8.892822265625, 9.1729736328125, 9.453125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 9.0, 6.0, 16.0, 13.0, 25.0, 34.0, 35.0, 68.0, 121.0, 204.0, 443.0, 1215.0, 4322.0, 22133.0, 224127.0, 3667950.0, 243732.0, 23027.0, 4540.0, 1279.0, 457.0, 210.0, 105.0, 77.0, 39.0, 28.0, 26.0, 10.0, 14.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1328125, -9.8211669921875, -9.509521484375, -9.1978759765625, -8.88623046875, -8.5745849609375, -8.262939453125, -7.9512939453125, -7.6396484375, -7.3280029296875, -7.016357421875, -6.7047119140625, -6.39306640625, -6.0814208984375, -5.769775390625, -5.4581298828125, -5.146484375, -4.8348388671875, -4.523193359375, -4.2115478515625, -3.89990234375, -3.5882568359375, -3.276611328125, -2.9649658203125, -2.6533203125, -2.3416748046875, -2.030029296875, -1.7183837890625, -1.40673828125, -1.0950927734375, -0.783447265625, -0.4718017578125, -0.16015625, 0.1514892578125, 0.463134765625, 0.7747802734375, 1.08642578125, 1.3980712890625, 1.709716796875, 2.0213623046875, 2.3330078125, 2.6446533203125, 2.956298828125, 3.2679443359375, 3.57958984375, 3.8912353515625, 4.202880859375, 4.5145263671875, 4.826171875, 5.1378173828125, 5.449462890625, 5.7611083984375, 6.07275390625, 6.3843994140625, 6.696044921875, 7.0076904296875, 7.3193359375, 7.6309814453125, 7.942626953125, 8.2542724609375, 8.56591796875, 8.8775634765625, 9.189208984375, 9.5008544921875, 9.8125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 7.0, 7.0, 13.0, 15.0, 23.0, 29.0, 52.0, 71.0, 87.0, 156.0, 270.0, 408.0, 670.0, 688.0, 567.0, 355.0, 219.0, 118.0, 70.0, 68.0, 42.0, 34.0, 20.0, 20.0, 19.0, 11.0, 7.0, 4.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.255859375, -2.188262939453125, -2.12066650390625, -2.053070068359375, -1.9854736328125, -1.917877197265625, -1.85028076171875, -1.782684326171875, -1.715087890625, -1.647491455078125, -1.57989501953125, -1.512298583984375, -1.4447021484375, -1.377105712890625, -1.30950927734375, -1.241912841796875, -1.17431640625, -1.106719970703125, -1.03912353515625, -0.971527099609375, -0.9039306640625, -0.836334228515625, -0.76873779296875, -0.701141357421875, -0.633544921875, -0.565948486328125, -0.49835205078125, -0.430755615234375, -0.3631591796875, -0.295562744140625, -0.22796630859375, -0.160369873046875, -0.0927734375, -0.025177001953125, 0.04241943359375, 0.110015869140625, 0.1776123046875, 0.245208740234375, 0.31280517578125, 0.380401611328125, 0.447998046875, 0.515594482421875, 0.58319091796875, 0.650787353515625, 0.7183837890625, 0.785980224609375, 0.85357666015625, 0.921173095703125, 0.98876953125, 1.056365966796875, 1.12396240234375, 1.191558837890625, 1.2591552734375, 1.326751708984375, 1.39434814453125, 1.461944580078125, 1.529541015625, 1.597137451171875, 1.66473388671875, 1.732330322265625, 1.7999267578125, 1.867523193359375, 1.93511962890625, 2.002716064453125, 2.0703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 6.0, 13.0, 18.0, 32.0, 63.0, 103.0, 214.0, 205.0, 148.0, 94.0, 59.0, 19.0, 15.0, 8.0, 5.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9347662925720215, -5.412812232971191, -4.8908586502075195, -4.368905067443848, -3.8469510078430176, -3.3249971866607666, -2.8030433654785156, -2.2810895442962646, -1.7591357231140137, -1.2371819019317627, -0.7152280807495117, -0.19327425956726074, 0.32867956161499023, 0.8506333827972412, 1.3725872039794922, 1.8945410251617432, 2.416494846343994, 2.938448667526245, 3.460402488708496, 3.982356309890747, 4.504310131072998, 5.026264190673828, 5.5482177734375, 6.070171356201172, 6.592125415802002, 7.114079475402832, 7.636033058166504, 8.157986640930176, 8.679941177368164, 9.201894760131836, 9.723848342895508, 10.24580192565918, 10.767755508422852, 11.289709091186523, 11.811662673950195, 12.333617210388184, 12.855570793151855, 13.377524375915527, 13.899478912353516, 14.421432495117188, 14.94338607788086, 15.465339660644531, 15.987293243408203, 16.509246826171875, 17.031200408935547, 17.55315589904785, 18.075109481811523, 18.597063064575195, 19.119016647338867, 19.64097023010254, 20.16292381286621, 20.684877395629883, 21.206832885742188, 21.72878646850586, 22.25074005126953, 22.772693634033203, 23.294647216796875, 23.816600799560547, 24.33855438232422, 24.86050796508789, 25.382461547851562, 25.904417037963867, 26.42637062072754, 26.94832420349121, 27.470277786254883]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 1.0, 6.0, 10.0, 13.0, 25.0, 24.0, 21.0, 33.0, 31.0, 47.0, 57.0, 73.0, 65.0, 76.0, 58.0, 69.0, 76.0, 70.0, 49.0, 46.0, 41.0, 28.0, 16.0, 13.0, 16.0, 9.0, 10.0, 2.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.259030818939209, -7.041027069091797, -6.823023796081543, -6.605020046234131, -6.387016296386719, -6.169013023376465, -5.951009273529053, -5.733005523681641, -5.515002250671387, -5.296998500823975, -5.078995227813721, -4.860991477966309, -4.6429877281188965, -4.424984455108643, -4.2069807052612305, -3.9889771938323975, -3.7709734439849854, -3.5529699325561523, -3.3349661827087402, -3.1169626712799072, -2.898959159851074, -2.680955410003662, -2.462951898574829, -2.244948387145996, -2.026944637298584, -1.8089410066604614, -1.5909374952316284, -1.3729338645935059, -1.1549303531646729, -0.9369267225265503, -0.7189230918884277, -0.5009195804595947, -0.2829160690307617, -0.06491248309612274, 0.15309110283851624, 0.3710947036743164, 0.5890982747077942, 0.807101845741272, 1.0251054763793945, 1.2431089878082275, 1.46111261844635, 1.6791162490844727, 1.8971197605133057, 2.1151232719421387, 2.333127021789551, 2.551130533218384, 2.769134044647217, 2.987137794494629, 3.205141305923462, 3.423144817352295, 3.641148567199707, 3.85915207862854, 4.077155590057373, 4.295159339904785, 4.513162612915039, 4.731166362762451, 4.949170112609863, 5.167173862457275, 5.385177135467529, 5.603180885314941, 5.8211846351623535, 6.039187908172607, 6.2571916580200195, 6.475194931030273, 6.6931986808776855]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 21.0, 23.0, 28.0, 63.0, 98.0, 186.0, 358.0, 631.0, 1432.0, 3807.0, 11427.0, 40153.0, 178351.0, 553683.0, 195354.0, 43454.0, 12361.0, 4054.0, 1647.0, 664.0, 306.0, 134.0, 105.0, 68.0, 34.0, 28.0, 16.0, 13.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.80859375, -1.747344970703125, -1.68609619140625, -1.624847412109375, -1.5635986328125, -1.502349853515625, -1.44110107421875, -1.379852294921875, -1.318603515625, -1.257354736328125, -1.19610595703125, -1.134857177734375, -1.0736083984375, -1.012359619140625, -0.95111083984375, -0.889862060546875, -0.82861328125, -0.767364501953125, -0.70611572265625, -0.644866943359375, -0.5836181640625, -0.522369384765625, -0.46112060546875, -0.399871826171875, -0.338623046875, -0.277374267578125, -0.21612548828125, -0.154876708984375, -0.0936279296875, -0.032379150390625, 0.02886962890625, 0.090118408203125, 0.1513671875, 0.212615966796875, 0.27386474609375, 0.335113525390625, 0.3963623046875, 0.457611083984375, 0.51885986328125, 0.580108642578125, 0.641357421875, 0.702606201171875, 0.76385498046875, 0.825103759765625, 0.8863525390625, 0.947601318359375, 1.00885009765625, 1.070098876953125, 1.13134765625, 1.192596435546875, 1.25384521484375, 1.315093994140625, 1.3763427734375, 1.437591552734375, 1.49884033203125, 1.560089111328125, 1.621337890625, 1.682586669921875, 1.74383544921875, 1.805084228515625, 1.8663330078125, 1.927581787109375, 1.98883056640625, 2.050079345703125, 2.111328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 2.0, 7.0, 6.0, 18.0, 13.0, 19.0, 33.0, 28.0, 40.0, 55.0, 73.0, 67.0, 84.0, 74.0, 72.0, 84.0, 75.0, 58.0, 45.0, 39.0, 29.0, 14.0, 15.0, 14.0, 9.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.0560302734375, -4.901123046875, -4.7462158203125, -4.59130859375, -4.4364013671875, -4.281494140625, -4.1265869140625, -3.9716796875, -3.8167724609375, -3.661865234375, -3.5069580078125, -3.35205078125, -3.1971435546875, -3.042236328125, -2.8873291015625, -2.732421875, -2.5775146484375, -2.422607421875, -2.2677001953125, -2.11279296875, -1.9578857421875, -1.802978515625, -1.6480712890625, -1.4931640625, -1.3382568359375, -1.183349609375, -1.0284423828125, -0.87353515625, -0.7186279296875, -0.563720703125, -0.4088134765625, -0.25390625, -0.0989990234375, 0.055908203125, 0.2108154296875, 0.36572265625, 0.5206298828125, 0.675537109375, 0.8304443359375, 0.9853515625, 1.1402587890625, 1.295166015625, 1.4500732421875, 1.60498046875, 1.7598876953125, 1.914794921875, 2.0697021484375, 2.224609375, 2.3795166015625, 2.534423828125, 2.6893310546875, 2.84423828125, 2.9991455078125, 3.154052734375, 3.3089599609375, 3.4638671875, 3.6187744140625, 3.773681640625, 3.9285888671875, 4.08349609375, 4.2384033203125, 4.393310546875, 4.5482177734375, 4.703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 10.0, 14.0, 14.0, 20.0, 32.0, 59.0, 72.0, 110.0, 170.0, 297.0, 479.0, 948.0, 2077.0, 4968.0, 13480.0, 40137.0, 148622.0, 461973.0, 271484.0, 68709.0, 21405.0, 7525.0, 3017.0, 1343.0, 651.0, 351.0, 186.0, 130.0, 86.0, 51.0, 31.0, 23.0, 17.0, 15.0, 13.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3759765625, -1.3296661376953125, -1.283355712890625, -1.2370452880859375, -1.19073486328125, -1.1444244384765625, -1.098114013671875, -1.0518035888671875, -1.0054931640625, -0.9591827392578125, -0.912872314453125, -0.8665618896484375, -0.82025146484375, -0.7739410400390625, -0.727630615234375, -0.6813201904296875, -0.635009765625, -0.5886993408203125, -0.542388916015625, -0.4960784912109375, -0.44976806640625, -0.4034576416015625, -0.357147216796875, -0.3108367919921875, -0.2645263671875, -0.2182159423828125, -0.171905517578125, -0.1255950927734375, -0.07928466796875, -0.0329742431640625, 0.013336181640625, 0.0596466064453125, 0.10595703125, 0.1522674560546875, 0.198577880859375, 0.2448883056640625, 0.29119873046875, 0.3375091552734375, 0.383819580078125, 0.4301300048828125, 0.4764404296875, 0.5227508544921875, 0.569061279296875, 0.6153717041015625, 0.66168212890625, 0.7079925537109375, 0.754302978515625, 0.8006134033203125, 0.846923828125, 0.8932342529296875, 0.939544677734375, 0.9858551025390625, 1.03216552734375, 1.0784759521484375, 1.124786376953125, 1.1710968017578125, 1.2174072265625, 1.2637176513671875, 1.310028076171875, 1.3563385009765625, 1.40264892578125, 1.4489593505859375, 1.495269775390625, 1.5415802001953125, 1.587890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 14.0, 7.0, 17.0, 13.0, 16.0, 29.0, 26.0, 25.0, 48.0, 40.0, 42.0, 40.0, 50.0, 59.0, 56.0, 60.0, 44.0, 53.0, 36.0, 46.0, 45.0, 36.0, 25.0, 25.0, 25.0, 17.0, 21.0, 23.0, 15.0, 8.0, 8.0, 6.0, 8.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.058349609375, -5.82763671875, -5.596923828125, -5.3662109375, -5.135498046875, -4.90478515625, -4.674072265625, -4.443359375, -4.212646484375, -3.98193359375, -3.751220703125, -3.5205078125, -3.289794921875, -3.05908203125, -2.828369140625, -2.59765625, -2.366943359375, -2.13623046875, -1.905517578125, -1.6748046875, -1.444091796875, -1.21337890625, -0.982666015625, -0.751953125, -0.521240234375, -0.29052734375, -0.059814453125, 0.1708984375, 0.401611328125, 0.63232421875, 0.863037109375, 1.09375, 1.324462890625, 1.55517578125, 1.785888671875, 2.0166015625, 2.247314453125, 2.47802734375, 2.708740234375, 2.939453125, 3.170166015625, 3.40087890625, 3.631591796875, 3.8623046875, 4.093017578125, 4.32373046875, 4.554443359375, 4.78515625, 5.015869140625, 5.24658203125, 5.477294921875, 5.7080078125, 5.938720703125, 6.16943359375, 6.400146484375, 6.630859375, 6.861572265625, 7.09228515625, 7.322998046875, 7.5537109375, 7.784423828125, 8.01513671875, 8.245849609375, 8.4765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 9.0, 8.0, 8.0, 24.0, 40.0, 68.0, 105.0, 191.0, 355.0, 693.0, 1527.0, 3528.0, 9058.0, 27585.0, 114422.0, 485689.0, 313396.0, 63266.0, 17650.0, 6043.0, 2527.0, 1131.0, 576.0, 273.0, 140.0, 97.0, 46.0, 32.0, 17.0, 12.0, 7.0, 8.0, 5.0, 5.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6777114868164062, -0.6557159423828125, -0.6337203979492188, -0.611724853515625, -0.5897293090820312, -0.5677337646484375, -0.5457382202148438, -0.52374267578125, -0.5017471313476562, -0.4797515869140625, -0.45775604248046875, -0.435760498046875, -0.41376495361328125, -0.3917694091796875, -0.36977386474609375, -0.3477783203125, -0.32578277587890625, -0.3037872314453125, -0.28179168701171875, -0.259796142578125, -0.23780059814453125, -0.2158050537109375, -0.19380950927734375, -0.17181396484375, -0.14981842041015625, -0.1278228759765625, -0.10582733154296875, -0.083831787109375, -0.06183624267578125, -0.0398406982421875, -0.01784515380859375, 0.004150390625, 0.02614593505859375, 0.0481414794921875, 0.07013702392578125, 0.092132568359375, 0.11412811279296875, 0.1361236572265625, 0.15811920166015625, 0.18011474609375, 0.20211029052734375, 0.2241058349609375, 0.24610137939453125, 0.268096923828125, 0.29009246826171875, 0.3120880126953125, 0.33408355712890625, 0.3560791015625, 0.37807464599609375, 0.4000701904296875, 0.42206573486328125, 0.444061279296875, 0.46605682373046875, 0.4880523681640625, 0.5100479125976562, 0.53204345703125, 0.5540390014648438, 0.5760345458984375, 0.5980300903320312, 0.620025634765625, 0.6420211791992188, 0.6640167236328125, 0.6860122680664062, 0.7080078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 4.0, 11.0, 6.0, 6.0, 2.0, 15.0, 9.0, 15.0, 10.0, 31.0, 33.0, 33.0, 50.0, 77.0, 60.0, 84.0, 99.0, 76.0, 73.0, 64.0, 42.0, 44.0, 29.0, 38.0, 24.0, 20.0, 10.0, 4.0, 9.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.000339508056640625, -0.0003306921571493149, -0.00032187625765800476, -0.00031306035816669464, -0.0003042444586753845, -0.0002954285591840744, -0.0002866126596927643, -0.00027779676020145416, -0.00026898086071014404, -0.0002601649612188339, -0.0002513490617275238, -0.00024253316223621368, -0.00023371726274490356, -0.00022490136325359344, -0.00021608546376228333, -0.0002072695642709732, -0.00019845366477966309, -0.00018963776528835297, -0.00018082186579704285, -0.00017200596630573273, -0.0001631900668144226, -0.0001543741673231125, -0.00014555826783180237, -0.00013674236834049225, -0.00012792646884918213, -0.00011911056935787201, -0.00011029466986656189, -0.00010147877037525177, -9.266287088394165e-05, -8.384697139263153e-05, -7.503107190132141e-05, -6.621517241001129e-05, -5.739927291870117e-05, -4.858337342739105e-05, -3.976747393608093e-05, -3.095157444477081e-05, -2.2135674953460693e-05, -1.3319775462150574e-05, -4.503875970840454e-06, 4.3120235204696655e-06, 1.3127923011779785e-05, 2.1943822503089905e-05, 3.0759721994400024e-05, 3.9575621485710144e-05, 4.8391520977020264e-05, 5.720742046833038e-05, 6.60233199596405e-05, 7.483921945095062e-05, 8.365511894226074e-05, 9.247101843357086e-05, 0.00010128691792488098, 0.0001101028174161911, 0.00011891871690750122, 0.00012773461639881134, 0.00013655051589012146, 0.00014536641538143158, 0.0001541823148727417, 0.00016299821436405182, 0.00017181411385536194, 0.00018063001334667206, 0.00018944591283798218, 0.0001982618123292923, 0.00020707771182060242, 0.00021589361131191254, 0.00022470951080322266]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 11.0, 9.0, 13.0, 20.0, 23.0, 39.0, 47.0, 59.0, 121.0, 147.0, 235.0, 399.0, 700.0, 1283.0, 2549.0, 5720.0, 13822.0, 40216.0, 142618.0, 427585.0, 291387.0, 79435.0, 24579.0, 9145.0, 3991.0, 1953.0, 987.0, 513.0, 339.0, 185.0, 112.0, 81.0, 70.0, 36.0, 33.0, 24.0, 11.0, 6.0, 8.0, 14.0, 7.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5595703125, -0.541961669921875, -0.52435302734375, -0.506744384765625, -0.4891357421875, -0.471527099609375, -0.45391845703125, -0.436309814453125, -0.418701171875, -0.401092529296875, -0.38348388671875, -0.365875244140625, -0.3482666015625, -0.330657958984375, -0.31304931640625, -0.295440673828125, -0.27783203125, -0.260223388671875, -0.24261474609375, -0.225006103515625, -0.2073974609375, -0.189788818359375, -0.17218017578125, -0.154571533203125, -0.136962890625, -0.119354248046875, -0.10174560546875, -0.084136962890625, -0.0665283203125, -0.048919677734375, -0.03131103515625, -0.013702392578125, 0.00390625, 0.021514892578125, 0.03912353515625, 0.056732177734375, 0.0743408203125, 0.091949462890625, 0.10955810546875, 0.127166748046875, 0.144775390625, 0.162384033203125, 0.17999267578125, 0.197601318359375, 0.2152099609375, 0.232818603515625, 0.25042724609375, 0.268035888671875, 0.28564453125, 0.303253173828125, 0.32086181640625, 0.338470458984375, 0.3560791015625, 0.373687744140625, 0.39129638671875, 0.408905029296875, 0.426513671875, 0.444122314453125, 0.46173095703125, 0.479339599609375, 0.4969482421875, 0.514556884765625, 0.53216552734375, 0.549774169921875, 0.5673828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 6.0, 10.0, 12.0, 16.0, 14.0, 20.0, 21.0, 24.0, 33.0, 38.0, 32.0, 47.0, 55.0, 64.0, 66.0, 62.0, 64.0, 52.0, 56.0, 40.0, 42.0, 34.0, 30.0, 30.0, 20.0, 21.0, 11.0, 11.0, 10.0, 8.0, 6.0, 5.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1219482421875, -0.11791229248046875, -0.1138763427734375, -0.10984039306640625, -0.105804443359375, -0.10176849365234375, -0.0977325439453125, -0.09369659423828125, -0.08966064453125, -0.08562469482421875, -0.0815887451171875, -0.07755279541015625, -0.073516845703125, -0.06948089599609375, -0.0654449462890625, -0.06140899658203125, -0.057373046875, -0.05333709716796875, -0.0493011474609375, -0.04526519775390625, -0.041229248046875, -0.03719329833984375, -0.0331573486328125, -0.02912139892578125, -0.02508544921875, -0.02104949951171875, -0.0170135498046875, -0.01297760009765625, -0.008941650390625, -0.00490570068359375, -0.0008697509765625, 0.00316619873046875, 0.0072021484375, 0.01123809814453125, 0.0152740478515625, 0.01930999755859375, 0.023345947265625, 0.02738189697265625, 0.0314178466796875, 0.03545379638671875, 0.03948974609375, 0.04352569580078125, 0.0475616455078125, 0.05159759521484375, 0.055633544921875, 0.05966949462890625, 0.0637054443359375, 0.06774139404296875, 0.07177734375, 0.07581329345703125, 0.0798492431640625, 0.08388519287109375, 0.087921142578125, 0.09195709228515625, 0.0959930419921875, 0.10002899169921875, 0.10406494140625, 0.10810089111328125, 0.1121368408203125, 0.11617279052734375, 0.120208740234375, 0.12424468994140625, 0.1282806396484375, 0.13231658935546875, 0.1363525390625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 22.0, 36.0, 76.0, 168.0, 256.0, 202.0, 113.0, 63.0, 20.0, 13.0, 13.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0867180824279785, -3.7099244594573975, -3.3331308364868164, -2.9563372135162354, -2.5795435905456543, -2.2027499675750732, -1.8259563446044922, -1.4491627216339111, -1.07236909866333, -0.695575475692749, -0.31878185272216797, 0.058011770248413086, 0.43480539321899414, 0.8115990161895752, 1.1883926391601562, 1.5651862621307373, 1.9419798851013184, 2.3187735080718994, 2.6955671310424805, 3.0723607540130615, 3.4491543769836426, 3.8259479999542236, 4.202741622924805, 4.579535484313965, 4.956328868865967, 5.333122253417969, 5.709916114807129, 6.086709976196289, 6.463503360748291, 6.840296745300293, 7.217090606689453, 7.593884468078613, 7.970678329467773, 8.347472190856934, 8.724266052246094, 9.101058959960938, 9.477852821350098, 9.854646682739258, 10.231439590454102, 10.608233451843262, 10.985027313232422, 11.361821174621582, 11.738615036010742, 12.115407943725586, 12.492201805114746, 12.868995666503906, 13.24578857421875, 13.62258243560791, 13.99937629699707, 14.37617015838623, 14.75296401977539, 15.129756927490234, 15.506550788879395, 15.883344650268555, 16.2601375579834, 16.636932373046875, 17.01372528076172, 17.390518188476562, 17.76731300354004, 18.144105911254883, 18.52090072631836, 18.897693634033203, 19.274486541748047, 19.651281356811523, 20.028074264526367]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 8.0, 19.0, 25.0, 25.0, 26.0, 46.0, 33.0, 58.0, 74.0, 74.0, 82.0, 68.0, 69.0, 75.0, 82.0, 57.0, 48.0, 28.0, 25.0, 18.0, 14.0, 8.0, 9.0, 4.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.580511569976807, -4.429073810577393, -4.2776360511779785, -4.1261982917785645, -3.9747607707977295, -3.8233230113983154, -3.6718854904174805, -3.5204477310180664, -3.3690099716186523, -3.2175722122192383, -3.066134452819824, -2.9146969318389893, -2.763259172439575, -2.611821413040161, -2.460383892059326, -2.308946132659912, -2.157508373260498, -2.006070613861084, -1.8546329736709595, -1.703195333480835, -1.551757574081421, -1.4003198146820068, -1.2488821744918823, -1.0974445343017578, -0.9460067749023438, -0.7945690751075745, -0.6431313753128052, -0.4916936755180359, -0.3402559757232666, -0.18881827592849731, -0.03738057613372803, 0.11405706405639648, 0.26549482345581055, 0.41693252325057983, 0.5683702230453491, 0.7198079228401184, 0.8712456226348877, 1.0226833820343018, 1.1741210222244263, 1.3255586624145508, 1.4769964218139648, 1.628434181213379, 1.7798718214035034, 1.931309461593628, 2.082747220993042, 2.234184980392456, 2.385622501373291, 2.537060260772705, 2.688498020172119, 2.839935779571533, 2.9913735389709473, 3.1428110599517822, 3.2942488193511963, 3.4456865787506104, 3.5971240997314453, 3.7485618591308594, 3.8999996185302734, 4.0514373779296875, 4.202875137329102, 4.354312896728516, 4.50575065612793, 4.6571879386901855, 4.8086256980896, 4.960063457489014, 5.111501216888428]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 15.0, 18.0, 19.0, 31.0, 55.0, 60.0, 112.0, 165.0, 292.0, 488.0, 802.0, 1608.0, 3453.0, 7611.0, 19401.0, 64143.0, 334190.0, 487238.0, 87056.0, 24677.0, 9005.0, 3875.0, 1897.0, 928.0, 580.0, 320.0, 186.0, 122.0, 69.0, 47.0, 32.0, 21.0, 15.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5390625, -3.41314697265625, -3.2872314453125, -3.16131591796875, -3.035400390625, -2.90948486328125, -2.7835693359375, -2.65765380859375, -2.53173828125, -2.40582275390625, -2.2799072265625, -2.15399169921875, -2.028076171875, -1.90216064453125, -1.7762451171875, -1.65032958984375, -1.5244140625, -1.39849853515625, -1.2725830078125, -1.14666748046875, -1.020751953125, -0.89483642578125, -0.7689208984375, -0.64300537109375, -0.51708984375, -0.39117431640625, -0.2652587890625, -0.13934326171875, -0.013427734375, 0.11248779296875, 0.2384033203125, 0.36431884765625, 0.490234375, 0.61614990234375, 0.7420654296875, 0.86798095703125, 0.993896484375, 1.11981201171875, 1.2457275390625, 1.37164306640625, 1.49755859375, 1.62347412109375, 1.7493896484375, 1.87530517578125, 2.001220703125, 2.12713623046875, 2.2530517578125, 2.37896728515625, 2.5048828125, 2.63079833984375, 2.7567138671875, 2.88262939453125, 3.008544921875, 3.13446044921875, 3.2603759765625, 3.38629150390625, 3.51220703125, 3.63812255859375, 3.7640380859375, 3.88995361328125, 4.015869140625, 4.14178466796875, 4.2677001953125, 4.39361572265625, 4.51953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 14.0, 13.0, 26.0, 27.0, 28.0, 37.0, 46.0, 76.0, 61.0, 82.0, 66.0, 86.0, 71.0, 76.0, 57.0, 54.0, 44.0, 36.0, 19.0, 13.0, 18.0, 6.0, 6.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5965576171875, -10.263427734375, -9.9302978515625, -9.59716796875, -9.2640380859375, -8.930908203125, -8.5977783203125, -8.2646484375, -7.9315185546875, -7.598388671875, -7.2652587890625, -6.93212890625, -6.5989990234375, -6.265869140625, -5.9327392578125, -5.599609375, -5.2664794921875, -4.933349609375, -4.6002197265625, -4.26708984375, -3.9339599609375, -3.600830078125, -3.2677001953125, -2.9345703125, -2.6014404296875, -2.268310546875, -1.9351806640625, -1.60205078125, -1.2689208984375, -0.935791015625, -0.6026611328125, -0.26953125, 0.0635986328125, 0.396728515625, 0.7298583984375, 1.06298828125, 1.3961181640625, 1.729248046875, 2.0623779296875, 2.3955078125, 2.7286376953125, 3.061767578125, 3.3948974609375, 3.72802734375, 4.0611572265625, 4.394287109375, 4.7274169921875, 5.060546875, 5.3936767578125, 5.726806640625, 6.0599365234375, 6.39306640625, 6.7261962890625, 7.059326171875, 7.3924560546875, 7.7255859375, 8.0587158203125, 8.391845703125, 8.7249755859375, 9.05810546875, 9.3912353515625, 9.724365234375, 10.0574951171875, 10.390625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 2.0, 8.0, 12.0, 20.0, 21.0, 31.0, 53.0, 59.0, 118.0, 226.0, 484.0, 1253.0, 4739.0, 28613.0, 394421.0, 570859.0, 38916.0, 5992.0, 1522.0, 536.0, 264.0, 148.0, 88.0, 51.0, 39.0, 16.0, 26.0, 19.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.466552734375, -4.27294921875, -4.079345703125, -3.8857421875, -3.692138671875, -3.49853515625, -3.304931640625, -3.111328125, -2.917724609375, -2.72412109375, -2.530517578125, -2.3369140625, -2.143310546875, -1.94970703125, -1.756103515625, -1.5625, -1.368896484375, -1.17529296875, -0.981689453125, -0.7880859375, -0.594482421875, -0.40087890625, -0.207275390625, -0.013671875, 0.179931640625, 0.37353515625, 0.567138671875, 0.7607421875, 0.954345703125, 1.14794921875, 1.341552734375, 1.53515625, 1.728759765625, 1.92236328125, 2.115966796875, 2.3095703125, 2.503173828125, 2.69677734375, 2.890380859375, 3.083984375, 3.277587890625, 3.47119140625, 3.664794921875, 3.8583984375, 4.052001953125, 4.24560546875, 4.439208984375, 4.6328125, 4.826416015625, 5.02001953125, 5.213623046875, 5.4072265625, 5.600830078125, 5.79443359375, 5.988037109375, 6.181640625, 6.375244140625, 6.56884765625, 6.762451171875, 6.9560546875, 7.149658203125, 7.34326171875, 7.536865234375, 7.73046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 12.0, 11.0, 19.0, 19.0, 14.0, 21.0, 33.0, 31.0, 38.0, 45.0, 23.0, 28.0, 53.0, 59.0, 59.0, 44.0, 57.0, 48.0, 53.0, 59.0, 36.0, 27.0, 32.0, 26.0, 26.0, 28.0, 15.0, 13.0, 14.0, 13.0, 6.0, 6.0, 3.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2308349609375, -9.899169921875, -9.5675048828125, -9.23583984375, -8.9041748046875, -8.572509765625, -8.2408447265625, -7.9091796875, -7.5775146484375, -7.245849609375, -6.9141845703125, -6.58251953125, -6.2508544921875, -5.919189453125, -5.5875244140625, -5.255859375, -4.9241943359375, -4.592529296875, -4.2608642578125, -3.92919921875, -3.5975341796875, -3.265869140625, -2.9342041015625, -2.6025390625, -2.2708740234375, -1.939208984375, -1.6075439453125, -1.27587890625, -0.9442138671875, -0.612548828125, -0.2808837890625, 0.05078125, 0.3824462890625, 0.714111328125, 1.0457763671875, 1.37744140625, 1.7091064453125, 2.040771484375, 2.3724365234375, 2.7041015625, 3.0357666015625, 3.367431640625, 3.6990966796875, 4.03076171875, 4.3624267578125, 4.694091796875, 5.0257568359375, 5.357421875, 5.6890869140625, 6.020751953125, 6.3524169921875, 6.68408203125, 7.0157470703125, 7.347412109375, 7.6790771484375, 8.0107421875, 8.3424072265625, 8.674072265625, 9.0057373046875, 9.33740234375, 9.6690673828125, 10.000732421875, 10.3323974609375, 10.6640625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 16.0, 28.0, 91.0, 266.0, 1558.0, 79382.0, 958510.0, 7825.0, 601.0, 149.0, 66.0, 26.0, 16.0, 5.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.27667236328125, -4.1353759765625, -3.99407958984375, -3.852783203125, -3.71148681640625, -3.5701904296875, -3.42889404296875, -3.28759765625, -3.14630126953125, -3.0050048828125, -2.86370849609375, -2.722412109375, -2.58111572265625, -2.4398193359375, -2.29852294921875, -2.1572265625, -2.01593017578125, -1.8746337890625, -1.73333740234375, -1.592041015625, -1.45074462890625, -1.3094482421875, -1.16815185546875, -1.02685546875, -0.88555908203125, -0.7442626953125, -0.60296630859375, -0.461669921875, -0.32037353515625, -0.1790771484375, -0.03778076171875, 0.103515625, 0.24481201171875, 0.3861083984375, 0.52740478515625, 0.668701171875, 0.80999755859375, 0.9512939453125, 1.09259033203125, 1.23388671875, 1.37518310546875, 1.5164794921875, 1.65777587890625, 1.799072265625, 1.94036865234375, 2.0816650390625, 2.22296142578125, 2.3642578125, 2.50555419921875, 2.6468505859375, 2.78814697265625, 2.929443359375, 3.07073974609375, 3.2120361328125, 3.35333251953125, 3.49462890625, 3.63592529296875, 3.7772216796875, 3.91851806640625, 4.059814453125, 4.20111083984375, 4.3424072265625, 4.48370361328125, 4.625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 9.0, 9.0, 16.0, 8.0, 15.0, 12.0, 22.0, 32.0, 33.0, 48.0, 63.0, 63.0, 96.0, 113.0, 96.0, 83.0, 71.0, 53.0, 41.0, 21.0, 23.0, 18.0, 18.0, 16.0, 4.0, 6.0, 6.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013577938079833984, -0.0001304764300584793, -0.00012517347931861877, -0.00011987052857875824, -0.0001145675778388977, -0.00010926462709903717, -0.00010396167635917664, -9.86587256193161e-05, -9.335577487945557e-05, -8.805282413959503e-05, -8.27498733997345e-05, -7.744692265987396e-05, -7.214397192001343e-05, -6.684102118015289e-05, -6.153807044029236e-05, -5.6235119700431824e-05, -5.093216896057129e-05, -4.5629218220710754e-05, -4.032626748085022e-05, -3.5023316740989685e-05, -2.972036600112915e-05, -2.4417415261268616e-05, -1.911446452140808e-05, -1.3811513781547546e-05, -8.508563041687012e-06, -3.205612301826477e-06, 2.0973384380340576e-06, 7.400289177894592e-06, 1.2703239917755127e-05, 1.800619065761566e-05, 2.3309141397476196e-05, 2.861209213733673e-05, 3.3915042877197266e-05, 3.92179936170578e-05, 4.4520944356918335e-05, 4.982389509677887e-05, 5.5126845836639404e-05, 6.042979657649994e-05, 6.573274731636047e-05, 7.103569805622101e-05, 7.633864879608154e-05, 8.164159953594208e-05, 8.694455027580261e-05, 9.224750101566315e-05, 9.755045175552368e-05, 0.00010285340249538422, 0.00010815635323524475, 0.00011345930397510529, 0.00011876225471496582, 0.00012406520545482635, 0.0001293681561946869, 0.00013467110693454742, 0.00013997405767440796, 0.0001452770084142685, 0.00015057995915412903, 0.00015588290989398956, 0.0001611858606338501, 0.00016648881137371063, 0.00017179176211357117, 0.0001770947128534317, 0.00018239766359329224, 0.00018770061433315277, 0.0001930035650730133, 0.00019830651581287384, 0.00020360946655273438]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 25.0, 26.0, 30.0, 68.0, 111.0, 166.0, 334.0, 676.0, 1710.0, 5287.0, 20236.0, 119264.0, 657718.0, 201446.0, 30422.0, 6994.0, 2323.0, 839.0, 348.0, 205.0, 101.0, 75.0, 54.0, 35.0, 15.0, 14.0, 12.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4423828125, -1.3994903564453125, -1.356597900390625, -1.3137054443359375, -1.27081298828125, -1.2279205322265625, -1.185028076171875, -1.1421356201171875, -1.0992431640625, -1.0563507080078125, -1.013458251953125, -0.9705657958984375, -0.92767333984375, -0.8847808837890625, -0.841888427734375, -0.7989959716796875, -0.756103515625, -0.7132110595703125, -0.670318603515625, -0.6274261474609375, -0.58453369140625, -0.5416412353515625, -0.498748779296875, -0.4558563232421875, -0.4129638671875, -0.3700714111328125, -0.327178955078125, -0.2842864990234375, -0.24139404296875, -0.1985015869140625, -0.155609130859375, -0.1127166748046875, -0.06982421875, -0.0269317626953125, 0.015960693359375, 0.0588531494140625, 0.10174560546875, 0.1446380615234375, 0.187530517578125, 0.2304229736328125, 0.2733154296875, 0.3162078857421875, 0.359100341796875, 0.4019927978515625, 0.44488525390625, 0.4877777099609375, 0.530670166015625, 0.5735626220703125, 0.616455078125, 0.6593475341796875, 0.702239990234375, 0.7451324462890625, 0.78802490234375, 0.8309173583984375, 0.873809814453125, 0.9167022705078125, 0.9595947265625, 1.0024871826171875, 1.045379638671875, 1.0882720947265625, 1.13116455078125, 1.1740570068359375, 1.216949462890625, 1.2598419189453125, 1.302734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 10.0, 15.0, 20.0, 30.0, 49.0, 59.0, 82.0, 134.0, 164.0, 129.0, 98.0, 77.0, 50.0, 33.0, 19.0, 8.0, 12.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.8021926879882812, -0.7747955322265625, -0.7473983764648438, -0.720001220703125, -0.6926040649414062, -0.6652069091796875, -0.6378097534179688, -0.61041259765625, -0.5830154418945312, -0.5556182861328125, -0.5282211303710938, -0.500823974609375, -0.47342681884765625, -0.4460296630859375, -0.41863250732421875, -0.3912353515625, -0.36383819580078125, -0.3364410400390625, -0.30904388427734375, -0.281646728515625, -0.25424957275390625, -0.2268524169921875, -0.19945526123046875, -0.17205810546875, -0.14466094970703125, -0.1172637939453125, -0.08986663818359375, -0.062469482421875, -0.03507232666015625, -0.0076751708984375, 0.01972198486328125, 0.047119140625, 0.07451629638671875, 0.1019134521484375, 0.12931060791015625, 0.156707763671875, 0.18410491943359375, 0.2115020751953125, 0.23889923095703125, 0.26629638671875, 0.29369354248046875, 0.3210906982421875, 0.34848785400390625, 0.375885009765625, 0.40328216552734375, 0.4306793212890625, 0.45807647705078125, 0.4854736328125, 0.5128707885742188, 0.5402679443359375, 0.5676651000976562, 0.595062255859375, 0.6224594116210938, 0.6498565673828125, 0.6772537231445312, 0.70465087890625, 0.7320480346679688, 0.7594451904296875, 0.7868423461914062, 0.814239501953125, 0.8416366577148438, 0.8690338134765625, 0.8964309692382812, 0.923828125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 10.0, 16.0, 45.0, 124.0, 269.0, 311.0, 152.0, 47.0, 24.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.645073890686035, -6.574057579040527, -5.503040790557861, -4.432024002075195, -3.3610076904296875, -2.2899913787841797, -1.2189745903015137, -0.14795780181884766, 0.9230585098266602, 1.994075059890747, 3.065091609954834, 4.1361083984375, 5.207124710083008, 6.278141021728516, 7.349157810211182, 8.420174598693848, 9.491190910339355, 10.562207221984863, 11.633224487304688, 12.704240798950195, 13.775257110595703, 14.846273422241211, 15.917289733886719, 16.98830795288086, 18.059322357177734, 19.130338668823242, 20.20135498046875, 21.272371292114258, 22.343387603759766, 23.414405822753906, 24.485422134399414, 25.556438446044922, 26.627452850341797, 27.698469161987305, 28.769485473632812, 29.84050178527832, 30.911518096923828, 31.98253631591797, 33.053550720214844, 34.124568939208984, 35.195587158203125, 36.266605377197266, 37.33761978149414, 38.40863800048828, 39.479652404785156, 40.5506706237793, 41.62168502807617, 42.69270324707031, 43.76371765136719, 44.83473587036133, 45.9057502746582, 46.976768493652344, 48.04778289794922, 49.11880111694336, 50.189815521240234, 51.260833740234375, 52.33184814453125, 53.40286636352539, 54.473880767822266, 55.544898986816406, 56.61591339111328, 57.68693161010742, 58.7579460144043, 59.82896423339844, 60.89998245239258]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 8.0, 0.0, 7.0, 7.0, 11.0, 12.0, 16.0, 12.0, 10.0, 26.0, 26.0, 33.0, 18.0, 26.0, 32.0, 28.0, 33.0, 58.0, 40.0, 51.0, 32.0, 51.0, 54.0, 31.0, 41.0, 46.0, 38.0, 38.0, 30.0, 23.0, 23.0, 35.0, 20.0, 19.0, 8.0, 9.0, 7.0, 17.0, 9.0, 10.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.096542358398438, -16.643341064453125, -16.190139770507812, -15.736936569213867, -15.283735275268555, -14.830533981323242, -14.377331733703613, -13.924129486083984, -13.470928192138672, -13.01772689819336, -12.56452465057373, -12.111322402954102, -11.658121109008789, -11.204919815063477, -10.751717567443848, -10.298515319824219, -9.845314025878906, -9.392112731933594, -8.938910484313965, -8.485708236694336, -8.032506942749023, -7.579305171966553, -7.126103401184082, -6.672901630401611, -6.219699859619141, -5.76649808883667, -5.313296318054199, -4.8600945472717285, -4.406892776489258, -3.953691005706787, -3.5004892349243164, -3.0472874641418457, -2.5940847396850586, -2.140882968902588, -1.6876811981201172, -1.2344794273376465, -0.7812776565551758, -0.3280758857727051, 0.12512588500976562, 0.5783276557922363, 1.031529426574707, 1.4847311973571777, 1.9379329681396484, 2.391134738922119, 2.84433650970459, 3.2975382804870605, 3.7507400512695312, 4.203941822052002, 4.657143592834473, 5.110345363616943, 5.563547134399414, 6.016748905181885, 6.4699506759643555, 6.923152446746826, 7.376354217529297, 7.829555988311768, 8.282757759094238, 8.735960006713867, 9.18916130065918, 9.642362594604492, 10.095564842224121, 10.54876708984375, 11.001968383789062, 11.455169677734375, 11.908371925354004]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 18.0, 29.0, 47.0, 87.0, 187.0, 330.0, 667.0, 1896.0, 6278.0, 29272.0, 669266.0, 3379883.0, 90277.0, 11240.0, 2803.0, 1063.0, 409.0, 207.0, 131.0, 58.0, 40.0, 30.0, 19.0, 4.0, 5.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -7.9610595703125, -7.586181640625, -7.2113037109375, -6.83642578125, -6.4615478515625, -6.086669921875, -5.7117919921875, -5.3369140625, -4.9620361328125, -4.587158203125, -4.2122802734375, -3.83740234375, -3.4625244140625, -3.087646484375, -2.7127685546875, -2.337890625, -1.9630126953125, -1.588134765625, -1.2132568359375, -0.83837890625, -0.4635009765625, -0.088623046875, 0.2862548828125, 0.6611328125, 1.0360107421875, 1.410888671875, 1.7857666015625, 2.16064453125, 2.5355224609375, 2.910400390625, 3.2852783203125, 3.66015625, 4.0350341796875, 4.409912109375, 4.7847900390625, 5.15966796875, 5.5345458984375, 5.909423828125, 6.2843017578125, 6.6591796875, 7.0340576171875, 7.408935546875, 7.7838134765625, 8.15869140625, 8.5335693359375, 8.908447265625, 9.2833251953125, 9.658203125, 10.0330810546875, 10.407958984375, 10.7828369140625, 11.15771484375, 11.5325927734375, 11.907470703125, 12.2823486328125, 12.6572265625, 13.0321044921875, 13.406982421875, 13.7818603515625, 14.15673828125, 14.5316162109375, 14.906494140625, 15.2813720703125, 15.65625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 9.0, 17.0, 26.0, 42.0, 40.0, 62.0, 67.0, 77.0, 93.0, 101.0, 107.0, 74.0, 69.0, 63.0, 48.0, 23.0, 32.0, 10.0, 10.0, 9.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3515625, -6.1365966796875, -5.921630859375, -5.7066650390625, -5.49169921875, -5.2767333984375, -5.061767578125, -4.8468017578125, -4.6318359375, -4.4168701171875, -4.201904296875, -3.9869384765625, -3.77197265625, -3.5570068359375, -3.342041015625, -3.1270751953125, -2.912109375, -2.6971435546875, -2.482177734375, -2.2672119140625, -2.05224609375, -1.8372802734375, -1.622314453125, -1.4073486328125, -1.1923828125, -0.9774169921875, -0.762451171875, -0.5474853515625, -0.33251953125, -0.1175537109375, 0.097412109375, 0.3123779296875, 0.52734375, 0.7423095703125, 0.957275390625, 1.1722412109375, 1.38720703125, 1.6021728515625, 1.817138671875, 2.0321044921875, 2.2470703125, 2.4620361328125, 2.677001953125, 2.8919677734375, 3.10693359375, 3.3218994140625, 3.536865234375, 3.7518310546875, 3.966796875, 4.1817626953125, 4.396728515625, 4.6116943359375, 4.82666015625, 5.0416259765625, 5.256591796875, 5.4715576171875, 5.6865234375, 5.9014892578125, 6.116455078125, 6.3314208984375, 6.54638671875, 6.7613525390625, 6.976318359375, 7.1912841796875, 7.40625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 14.0, 15.0, 22.0, 32.0, 62.0, 88.0, 216.0, 493.0, 1394.0, 6163.0, 52155.0, 3349963.0, 753489.0, 24768.0, 3682.0, 955.0, 362.0, 163.0, 70.0, 51.0, 31.0, 19.0, 19.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.29443359375, -9.9248046875, -9.55517578125, -9.185546875, -8.81591796875, -8.4462890625, -8.07666015625, -7.70703125, -7.33740234375, -6.9677734375, -6.59814453125, -6.228515625, -5.85888671875, -5.4892578125, -5.11962890625, -4.75, -4.38037109375, -4.0107421875, -3.64111328125, -3.271484375, -2.90185546875, -2.5322265625, -2.16259765625, -1.79296875, -1.42333984375, -1.0537109375, -0.68408203125, -0.314453125, 0.05517578125, 0.4248046875, 0.79443359375, 1.1640625, 1.53369140625, 1.9033203125, 2.27294921875, 2.642578125, 3.01220703125, 3.3818359375, 3.75146484375, 4.12109375, 4.49072265625, 4.8603515625, 5.22998046875, 5.599609375, 5.96923828125, 6.3388671875, 6.70849609375, 7.078125, 7.44775390625, 7.8173828125, 8.18701171875, 8.556640625, 8.92626953125, 9.2958984375, 9.66552734375, 10.03515625, 10.40478515625, 10.7744140625, 11.14404296875, 11.513671875, 11.88330078125, 12.2529296875, 12.62255859375, 12.9921875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 13.0, 16.0, 22.0, 34.0, 37.0, 59.0, 89.0, 145.0, 250.0, 436.0, 792.0, 849.0, 544.0, 275.0, 169.0, 100.0, 79.0, 46.0, 34.0, 18.0, 16.0, 8.0, 8.0, 9.0, 2.0, 4.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05859375, -1.987762451171875, -1.91693115234375, -1.846099853515625, -1.7752685546875, -1.704437255859375, -1.63360595703125, -1.562774658203125, -1.491943359375, -1.421112060546875, -1.35028076171875, -1.279449462890625, -1.2086181640625, -1.137786865234375, -1.06695556640625, -0.996124267578125, -0.92529296875, -0.854461669921875, -0.78363037109375, -0.712799072265625, -0.6419677734375, -0.571136474609375, -0.50030517578125, -0.429473876953125, -0.358642578125, -0.287811279296875, -0.21697998046875, -0.146148681640625, -0.0753173828125, -0.004486083984375, 0.06634521484375, 0.137176513671875, 0.2080078125, 0.278839111328125, 0.34967041015625, 0.420501708984375, 0.4913330078125, 0.562164306640625, 0.63299560546875, 0.703826904296875, 0.774658203125, 0.845489501953125, 0.91632080078125, 0.987152099609375, 1.0579833984375, 1.128814697265625, 1.19964599609375, 1.270477294921875, 1.34130859375, 1.412139892578125, 1.48297119140625, 1.553802490234375, 1.6246337890625, 1.695465087890625, 1.76629638671875, 1.837127685546875, 1.907958984375, 1.978790283203125, 2.04962158203125, 2.120452880859375, 2.1912841796875, 2.262115478515625, 2.33294677734375, 2.403778076171875, 2.474609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 23.0, 34.0, 60.0, 84.0, 177.0, 193.0, 167.0, 119.0, 77.0, 26.0, 16.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.969508171081543, -5.497320652008057, -5.02513313293457, -4.552945137023926, -4.0807576179504395, -3.608570098876953, -3.1363823413848877, -2.6641945838928223, -2.192007064819336, -1.71981942653656, -1.2476317882537842, -0.7754441499710083, -0.3032565116882324, 0.1689310073852539, 0.6411187648773193, 1.1133065223693848, 1.585494041442871, 2.0576815605163574, 2.529869318008423, 3.0020570755004883, 3.4742445945739746, 3.946432113647461, 4.4186201095581055, 4.890807628631592, 5.362995147705078, 5.8351826667785645, 6.307370185852051, 6.779558181762695, 7.251745700836182, 7.723933219909668, 8.196121215820312, 8.66830825805664, 9.140495300292969, 9.612683296203613, 10.084870338439941, 10.557058334350586, 11.029245376586914, 11.501433372497559, 11.973621368408203, 12.445808410644531, 12.917996406555176, 13.39018440246582, 13.862371444702148, 14.334559440612793, 14.806747436523438, 15.278934478759766, 15.75112247467041, 16.223310470581055, 16.695497512817383, 17.16768455505371, 17.639873504638672, 18.112060546875, 18.584247589111328, 19.056434631347656, 19.528623580932617, 20.000810623168945, 20.472999572753906, 20.945186614990234, 21.417375564575195, 21.889562606811523, 22.36174964904785, 22.833938598632812, 23.30612564086914, 23.77831268310547, 24.250499725341797]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 10.0, 11.0, 10.0, 19.0, 24.0, 26.0, 38.0, 45.0, 40.0, 33.0, 61.0, 35.0, 70.0, 67.0, 53.0, 61.0, 55.0, 64.0, 48.0, 44.0, 41.0, 29.0, 24.0, 18.0, 20.0, 16.0, 8.0, 7.0, 10.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.938656806945801, -4.764148235321045, -4.589639663696289, -4.415131092071533, -4.240622520446777, -4.066113471984863, -3.8916049003601074, -3.7170963287353516, -3.5425877571105957, -3.36807918548584, -3.193570613861084, -3.019061803817749, -2.844553232192993, -2.6700446605682373, -2.4955358505249023, -2.3210272789001465, -2.1465187072753906, -1.9720101356506348, -1.7975014448165894, -1.622992753982544, -1.448484182357788, -1.2739756107330322, -1.0994669198989868, -0.9249582290649414, -0.7504496574401855, -0.5759410262107849, -0.4014323949813843, -0.22692376375198364, -0.05241513252258301, 0.12209349870681763, 0.29660212993621826, 0.47111082077026367, 0.6456198692321777, 0.8201285004615784, 0.994637131690979, 1.1691458225250244, 1.3436543941497803, 1.5181629657745361, 1.6926716566085815, 1.867180347442627, 2.041688919067383, 2.2161974906921387, 2.3907060623168945, 2.5652148723602295, 2.7397234439849854, 2.914232015609741, 3.088740825653076, 3.263249397277832, 3.437757968902588, 3.6122665405273438, 3.7867751121520996, 3.9612839221954346, 4.1357927322387695, 4.310301303863525, 4.484809875488281, 4.659318447113037, 4.833827018737793, 5.008335590362549, 5.182844161987305, 5.3573527336120605, 5.531861305236816, 5.7063703536987305, 5.880878925323486, 6.055387496948242, 6.229896068572998]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 8.0, 14.0, 20.0, 28.0, 38.0, 66.0, 121.0, 187.0, 345.0, 676.0, 1224.0, 2621.0, 6033.0, 15705.0, 50563.0, 213755.0, 502354.0, 185350.0, 44557.0, 14248.0, 5638.0, 2447.0, 1168.0, 582.0, 328.0, 161.0, 103.0, 69.0, 39.0, 39.0, 17.0, 12.0, 15.0, 7.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4781341552734375, -1.427947998046875, -1.3777618408203125, -1.32757568359375, -1.2773895263671875, -1.227203369140625, -1.1770172119140625, -1.1268310546875, -1.0766448974609375, -1.026458740234375, -0.9762725830078125, -0.92608642578125, -0.8759002685546875, -0.825714111328125, -0.7755279541015625, -0.725341796875, -0.6751556396484375, -0.624969482421875, -0.5747833251953125, -0.52459716796875, -0.4744110107421875, -0.424224853515625, -0.3740386962890625, -0.3238525390625, -0.2736663818359375, -0.223480224609375, -0.1732940673828125, -0.12310791015625, -0.0729217529296875, -0.022735595703125, 0.0274505615234375, 0.07763671875, 0.1278228759765625, 0.178009033203125, 0.2281951904296875, 0.27838134765625, 0.3285675048828125, 0.378753662109375, 0.4289398193359375, 0.4791259765625, 0.5293121337890625, 0.579498291015625, 0.6296844482421875, 0.67987060546875, 0.7300567626953125, 0.780242919921875, 0.8304290771484375, 0.880615234375, 0.9308013916015625, 0.980987548828125, 1.0311737060546875, 1.08135986328125, 1.1315460205078125, 1.181732177734375, 1.2319183349609375, 1.2821044921875, 1.3322906494140625, 1.382476806640625, 1.4326629638671875, 1.48284912109375, 1.5330352783203125, 1.583221435546875, 1.6334075927734375, 1.68359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 5.0, 9.0, 19.0, 17.0, 28.0, 34.0, 44.0, 45.0, 41.0, 61.0, 87.0, 73.0, 76.0, 64.0, 87.0, 54.0, 54.0, 35.0, 41.0, 27.0, 34.0, 20.0, 15.0, 6.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.304779052734375, -3.17010498046875, -3.035430908203125, -2.9007568359375, -2.766082763671875, -2.63140869140625, -2.496734619140625, -2.362060546875, -2.227386474609375, -2.09271240234375, -1.958038330078125, -1.8233642578125, -1.688690185546875, -1.55401611328125, -1.419342041015625, -1.28466796875, -1.149993896484375, -1.01531982421875, -0.880645751953125, -0.7459716796875, -0.611297607421875, -0.47662353515625, -0.341949462890625, -0.207275390625, -0.072601318359375, 0.06207275390625, 0.196746826171875, 0.3314208984375, 0.466094970703125, 0.60076904296875, 0.735443115234375, 0.8701171875, 1.004791259765625, 1.13946533203125, 1.274139404296875, 1.4088134765625, 1.543487548828125, 1.67816162109375, 1.812835693359375, 1.947509765625, 2.082183837890625, 2.21685791015625, 2.351531982421875, 2.4862060546875, 2.620880126953125, 2.75555419921875, 2.890228271484375, 3.02490234375, 3.159576416015625, 3.29425048828125, 3.428924560546875, 3.5635986328125, 3.698272705078125, 3.83294677734375, 3.967620849609375, 4.102294921875, 4.236968994140625, 4.37164306640625, 4.506317138671875, 4.6409912109375, 4.775665283203125, 4.91033935546875, 5.045013427734375, 5.1796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 8.0, 8.0, 16.0, 24.0, 27.0, 50.0, 71.0, 153.0, 341.0, 696.0, 1866.0, 5506.0, 20801.0, 130774.0, 652388.0, 197260.0, 27712.0, 6939.0, 2217.0, 855.0, 369.0, 177.0, 105.0, 62.0, 27.0, 21.0, 20.0, 10.0, 11.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126953125, -2.05963134765625, -1.9923095703125, -1.92498779296875, -1.857666015625, -1.79034423828125, -1.7230224609375, -1.65570068359375, -1.58837890625, -1.52105712890625, -1.4537353515625, -1.38641357421875, -1.319091796875, -1.25177001953125, -1.1844482421875, -1.11712646484375, -1.0498046875, -0.98248291015625, -0.9151611328125, -0.84783935546875, -0.780517578125, -0.71319580078125, -0.6458740234375, -0.57855224609375, -0.51123046875, -0.44390869140625, -0.3765869140625, -0.30926513671875, -0.241943359375, -0.17462158203125, -0.1072998046875, -0.03997802734375, 0.02734375, 0.09466552734375, 0.1619873046875, 0.22930908203125, 0.296630859375, 0.36395263671875, 0.4312744140625, 0.49859619140625, 0.56591796875, 0.63323974609375, 0.7005615234375, 0.76788330078125, 0.835205078125, 0.90252685546875, 0.9698486328125, 1.03717041015625, 1.1044921875, 1.17181396484375, 1.2391357421875, 1.30645751953125, 1.373779296875, 1.44110107421875, 1.5084228515625, 1.57574462890625, 1.64306640625, 1.71038818359375, 1.7777099609375, 1.84503173828125, 1.912353515625, 1.97967529296875, 2.0469970703125, 2.11431884765625, 2.181640625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 7.0, 7.0, 6.0, 9.0, 13.0, 14.0, 15.0, 28.0, 25.0, 28.0, 30.0, 39.0, 37.0, 41.0, 38.0, 45.0, 35.0, 44.0, 41.0, 43.0, 43.0, 39.0, 27.0, 48.0, 37.0, 30.0, 35.0, 30.0, 19.0, 21.0, 20.0, 15.0, 17.0, 18.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-5.25, -5.08636474609375, -4.9227294921875, -4.75909423828125, -4.595458984375, -4.43182373046875, -4.2681884765625, -4.10455322265625, -3.94091796875, -3.77728271484375, -3.6136474609375, -3.45001220703125, -3.286376953125, -3.12274169921875, -2.9591064453125, -2.79547119140625, -2.6318359375, -2.46820068359375, -2.3045654296875, -2.14093017578125, -1.977294921875, -1.81365966796875, -1.6500244140625, -1.48638916015625, -1.32275390625, -1.15911865234375, -0.9954833984375, -0.83184814453125, -0.668212890625, -0.50457763671875, -0.3409423828125, -0.17730712890625, -0.013671875, 0.14996337890625, 0.3135986328125, 0.47723388671875, 0.640869140625, 0.80450439453125, 0.9681396484375, 1.13177490234375, 1.29541015625, 1.45904541015625, 1.6226806640625, 1.78631591796875, 1.949951171875, 2.11358642578125, 2.2772216796875, 2.44085693359375, 2.6044921875, 2.76812744140625, 2.9317626953125, 3.09539794921875, 3.259033203125, 3.42266845703125, 3.5863037109375, 3.74993896484375, 3.91357421875, 4.07720947265625, 4.2408447265625, 4.40447998046875, 4.568115234375, 4.73175048828125, 4.8953857421875, 5.05902099609375, 5.22265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 8.0, 7.0, 15.0, 13.0, 16.0, 18.0, 38.0, 72.0, 113.0, 223.0, 397.0, 796.0, 1691.0, 4230.0, 12216.0, 56211.0, 433256.0, 458150.0, 60073.0, 12889.0, 4432.0, 1847.0, 862.0, 418.0, 209.0, 142.0, 69.0, 37.0, 39.0, 18.0, 11.0, 13.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8984375, -0.8703765869140625, -0.842315673828125, -0.8142547607421875, -0.78619384765625, -0.7581329345703125, -0.730072021484375, -0.7020111083984375, -0.6739501953125, -0.6458892822265625, -0.617828369140625, -0.5897674560546875, -0.56170654296875, -0.5336456298828125, -0.505584716796875, -0.4775238037109375, -0.449462890625, -0.4214019775390625, -0.393341064453125, -0.3652801513671875, -0.33721923828125, -0.3091583251953125, -0.281097412109375, -0.2530364990234375, -0.2249755859375, -0.1969146728515625, -0.168853759765625, -0.1407928466796875, -0.11273193359375, -0.0846710205078125, -0.056610107421875, -0.0285491943359375, -0.00048828125, 0.0275726318359375, 0.055633544921875, 0.0836944580078125, 0.11175537109375, 0.1398162841796875, 0.167877197265625, 0.1959381103515625, 0.2239990234375, 0.2520599365234375, 0.280120849609375, 0.3081817626953125, 0.33624267578125, 0.3643035888671875, 0.392364501953125, 0.4204254150390625, 0.448486328125, 0.4765472412109375, 0.504608154296875, 0.5326690673828125, 0.56072998046875, 0.5887908935546875, 0.616851806640625, 0.6449127197265625, 0.6729736328125, 0.7010345458984375, 0.729095458984375, 0.7571563720703125, 0.78521728515625, 0.8132781982421875, 0.841339111328125, 0.8694000244140625, 0.8974609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 8.0, 17.0, 18.0, 30.0, 47.0, 47.0, 101.0, 121.0, 129.0, 126.0, 105.0, 58.0, 48.0, 32.0, 18.0, 14.0, 14.0, 11.0, 3.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004360675811767578, -0.0004231072962284088, -0.0004101470112800598, -0.0003971867263317108, -0.0003842264413833618, -0.0003712661564350128, -0.0003583058714866638, -0.0003453455865383148, -0.0003323853015899658, -0.0003194250166416168, -0.0003064647316932678, -0.0002935044467449188, -0.0002805441617965698, -0.0002675838768482208, -0.0002546235918998718, -0.00024166330695152283, -0.00022870302200317383, -0.00021574273705482483, -0.00020278245210647583, -0.00018982216715812683, -0.00017686188220977783, -0.00016390159726142883, -0.00015094131231307983, -0.00013798102736473083, -0.00012502074241638184, -0.00011206045746803284, -9.910017251968384e-05, -8.613988757133484e-05, -7.317960262298584e-05, -6.021931767463684e-05, -4.725903272628784e-05, -3.429874777793884e-05, -2.1338462829589844e-05, -8.378177881240845e-06, 4.582107067108154e-06, 1.7542392015457153e-05, 3.0502676963806152e-05, 4.346296191215515e-05, 5.642324686050415e-05, 6.938353180885315e-05, 8.234381675720215e-05, 9.530410170555115e-05, 0.00010826438665390015, 0.00012122467160224915, 0.00013418495655059814, 0.00014714524149894714, 0.00016010552644729614, 0.00017306581139564514, 0.00018602609634399414, 0.00019898638129234314, 0.00021194666624069214, 0.00022490695118904114, 0.00023786723613739014, 0.00025082752108573914, 0.00026378780603408813, 0.00027674809098243713, 0.00028970837593078613, 0.00030266866087913513, 0.00031562894582748413, 0.00032858923077583313, 0.00034154951572418213, 0.00035450980067253113, 0.0003674700856208801, 0.0003804303705692291, 0.0003933906555175781]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 10.0, 6.0, 13.0, 20.0, 30.0, 29.0, 52.0, 79.0, 108.0, 192.0, 301.0, 568.0, 830.0, 1529.0, 2950.0, 5742.0, 12144.0, 29917.0, 82931.0, 262694.0, 397856.0, 160376.0, 52044.0, 19996.0, 8685.0, 4203.0, 2172.0, 1204.0, 673.0, 430.0, 266.0, 159.0, 105.0, 66.0, 61.0, 34.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.60205078125, -0.5854568481445312, -0.5688629150390625, -0.5522689819335938, -0.535675048828125, -0.5190811157226562, -0.5024871826171875, -0.48589324951171875, -0.46929931640625, -0.45270538330078125, -0.4361114501953125, -0.41951751708984375, -0.402923583984375, -0.38632965087890625, -0.3697357177734375, -0.35314178466796875, -0.3365478515625, -0.31995391845703125, -0.3033599853515625, -0.28676605224609375, -0.270172119140625, -0.25357818603515625, -0.2369842529296875, -0.22039031982421875, -0.20379638671875, -0.18720245361328125, -0.1706085205078125, -0.15401458740234375, -0.137420654296875, -0.12082672119140625, -0.1042327880859375, -0.08763885498046875, -0.071044921875, -0.05445098876953125, -0.0378570556640625, -0.02126312255859375, -0.004669189453125, 0.01192474365234375, 0.0285186767578125, 0.04511260986328125, 0.06170654296875, 0.07830047607421875, 0.0948944091796875, 0.11148834228515625, 0.128082275390625, 0.14467620849609375, 0.1612701416015625, 0.17786407470703125, 0.1944580078125, 0.21105194091796875, 0.2276458740234375, 0.24423980712890625, 0.260833740234375, 0.27742767333984375, 0.2940216064453125, 0.31061553955078125, 0.32720947265625, 0.34380340576171875, 0.3603973388671875, 0.37699127197265625, 0.393585205078125, 0.41017913818359375, 0.4267730712890625, 0.44336700439453125, 0.4599609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 5.0, 9.0, 8.0, 9.0, 6.0, 9.0, 16.0, 9.0, 22.0, 26.0, 43.0, 38.0, 40.0, 67.0, 63.0, 57.0, 80.0, 71.0, 78.0, 70.0, 44.0, 48.0, 32.0, 34.0, 16.0, 15.0, 14.0, 12.0, 8.0, 9.0, 8.0, 7.0, 6.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14018630981445312, -0.13498687744140625, -0.12978744506835938, -0.1245880126953125, -0.11938858032226562, -0.11418914794921875, -0.10898971557617188, -0.103790283203125, -0.09859085083007812, -0.09339141845703125, -0.08819198608398438, -0.0829925537109375, -0.07779312133789062, -0.07259368896484375, -0.06739425659179688, -0.06219482421875, -0.056995391845703125, -0.05179595947265625, -0.046596527099609375, -0.0413970947265625, -0.036197662353515625, -0.03099822998046875, -0.025798797607421875, -0.020599365234375, -0.015399932861328125, -0.01020050048828125, -0.005001068115234375, 0.0001983642578125, 0.005397796630859375, 0.01059722900390625, 0.015796661376953125, 0.02099609375, 0.026195526123046875, 0.03139495849609375, 0.036594390869140625, 0.0417938232421875, 0.046993255615234375, 0.05219268798828125, 0.057392120361328125, 0.062591552734375, 0.06779098510742188, 0.07299041748046875, 0.07818984985351562, 0.0833892822265625, 0.08858871459960938, 0.09378814697265625, 0.09898757934570312, 0.10418701171875, 0.10938644409179688, 0.11458587646484375, 0.11978530883789062, 0.1249847412109375, 0.13018417358398438, 0.13538360595703125, 0.14058303833007812, 0.145782470703125, 0.15098190307617188, 0.15618133544921875, 0.16138076782226562, 0.1665802001953125, 0.17177963256835938, 0.17697906494140625, 0.18217849731445312, 0.1873779296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 23.0, 54.0, 111.0, 244.0, 275.0, 172.0, 68.0, 30.0, 12.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.353297233581543, -7.940892696380615, -7.528488636016846, -7.116084098815918, -6.703680038452148, -6.291275501251221, -5.878870964050293, -5.466466903686523, -5.054062366485596, -4.641657829284668, -4.229253768920898, -3.8168492317199707, -3.404444932937622, -2.9920406341552734, -2.5796360969543457, -2.167231798171997, -1.7548274993896484, -1.3424232006072998, -0.9300187826156616, -0.5176143646240234, -0.1052100658416748, 0.30719423294067383, 0.7195987701416016, 1.1320030689239502, 1.5444073677062988, 1.9568116664886475, 2.369215965270996, 2.781620502471924, 3.1940248012542725, 3.606429100036621, 4.018833637237549, 4.431238174438477, 4.8436431884765625, 5.25604772567749, 5.66845178604126, 6.0808563232421875, 6.493260383605957, 6.905664920806885, 7.3180694580078125, 7.730473518371582, 8.142877578735352, 8.555281639099121, 8.967686653137207, 9.380090713500977, 9.792494773864746, 10.204898834228516, 10.617303848266602, 11.029707908630371, 11.442112922668457, 11.854516983032227, 12.266921997070312, 12.679326057434082, 13.091730117797852, 13.504135131835938, 13.916539192199707, 14.328943252563477, 14.741348266601562, 15.153752326965332, 15.566157341003418, 15.978561401367188, 16.390966415405273, 16.803369522094727, 17.215774536132812, 17.6281795501709, 18.04058265686035]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 5.0, 3.0, 9.0, 12.0, 19.0, 17.0, 24.0, 39.0, 36.0, 37.0, 51.0, 43.0, 60.0, 70.0, 68.0, 59.0, 66.0, 63.0, 73.0, 50.0, 42.0, 34.0, 30.0, 26.0, 21.0, 11.0, 6.0, 15.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431551694869995, -3.312861919403076, -3.194171905517578, -3.075482130050659, -2.9567923545837402, -2.838102340698242, -2.7194125652313232, -2.6007227897644043, -2.4820327758789062, -2.3633430004119873, -2.2446529865264893, -2.1259632110595703, -2.0072734355926514, -1.8885835409164429, -1.7698936462402344, -1.6512038707733154, -1.5325140953063965, -1.413824200630188, -1.295134425163269, -1.1764445304870605, -1.0577547550201416, -0.9390648603439331, -0.8203749656677246, -0.7016851305961609, -0.5829952955245972, -0.46430546045303345, -0.34561559557914734, -0.22692573070526123, -0.10823589563369751, 0.010453939437866211, 0.1291438341140747, 0.24783366918563843, 0.36652374267578125, 0.48521357774734497, 0.6039034128189087, 0.7225933074951172, 0.8412831425666809, 0.9599729776382446, 1.0786628723144531, 1.197352647781372, 1.3160425424575806, 1.434732437133789, 1.553422212600708, 1.6721121072769165, 1.790802001953125, 1.909491777420044, 2.028181552886963, 2.146871566772461, 2.26556134223938, 2.384251117706299, 2.502941131591797, 2.621630907058716, 2.7403206825256348, 2.859010696411133, 2.9777004718780518, 3.0963902473449707, 3.2150802612304688, 3.3337700366973877, 3.4524600505828857, 3.5711498260498047, 3.6898396015167236, 3.8085293769836426, 3.9272193908691406, 4.045909404754639, 4.1645989418029785]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 18.0, 32.0, 59.0, 84.0, 201.0, 384.0, 873.0, 2041.0, 5869.0, 21124.0, 139934.0, 774280.0, 80834.0, 15236.0, 4493.0, 1714.0, 714.0, 313.0, 153.0, 74.0, 52.0, 19.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.309326171875, -4.14599609375, -3.982666015625, -3.8193359375, -3.656005859375, -3.49267578125, -3.329345703125, -3.166015625, -3.002685546875, -2.83935546875, -2.676025390625, -2.5126953125, -2.349365234375, -2.18603515625, -2.022705078125, -1.859375, -1.696044921875, -1.53271484375, -1.369384765625, -1.2060546875, -1.042724609375, -0.87939453125, -0.716064453125, -0.552734375, -0.389404296875, -0.22607421875, -0.062744140625, 0.1005859375, 0.263916015625, 0.42724609375, 0.590576171875, 0.75390625, 0.917236328125, 1.08056640625, 1.243896484375, 1.4072265625, 1.570556640625, 1.73388671875, 1.897216796875, 2.060546875, 2.223876953125, 2.38720703125, 2.550537109375, 2.7138671875, 2.877197265625, 3.04052734375, 3.203857421875, 3.3671875, 3.530517578125, 3.69384765625, 3.857177734375, 4.0205078125, 4.183837890625, 4.34716796875, 4.510498046875, 4.673828125, 4.837158203125, 5.00048828125, 5.163818359375, 5.3271484375, 5.490478515625, 5.65380859375, 5.817138671875, 5.98046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 4.0, 12.0, 17.0, 15.0, 18.0, 36.0, 38.0, 37.0, 39.0, 45.0, 63.0, 70.0, 68.0, 63.0, 61.0, 61.0, 67.0, 58.0, 49.0, 37.0, 32.0, 24.0, 25.0, 14.0, 9.0, 10.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.2071533203125, -6.961181640625, -6.7152099609375, -6.46923828125, -6.2232666015625, -5.977294921875, -5.7313232421875, -5.4853515625, -5.2393798828125, -4.993408203125, -4.7474365234375, -4.50146484375, -4.2554931640625, -4.009521484375, -3.7635498046875, -3.517578125, -3.2716064453125, -3.025634765625, -2.7796630859375, -2.53369140625, -2.2877197265625, -2.041748046875, -1.7957763671875, -1.5498046875, -1.3038330078125, -1.057861328125, -0.8118896484375, -0.56591796875, -0.3199462890625, -0.073974609375, 0.1719970703125, 0.41796875, 0.6639404296875, 0.909912109375, 1.1558837890625, 1.40185546875, 1.6478271484375, 1.893798828125, 2.1397705078125, 2.3857421875, 2.6317138671875, 2.877685546875, 3.1236572265625, 3.36962890625, 3.6156005859375, 3.861572265625, 4.1075439453125, 4.353515625, 4.5994873046875, 4.845458984375, 5.0914306640625, 5.33740234375, 5.5833740234375, 5.829345703125, 6.0753173828125, 6.3212890625, 6.5672607421875, 6.813232421875, 7.0592041015625, 7.30517578125, 7.5511474609375, 7.797119140625, 8.0430908203125, 8.2890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 14.0, 10.0, 17.0, 22.0, 14.0, 15.0, 25.0, 36.0, 62.0, 75.0, 94.0, 211.0, 1007.0, 14149.0, 944753.0, 84540.0, 2729.0, 357.0, 118.0, 59.0, 53.0, 41.0, 22.0, 26.0, 18.0, 14.0, 12.0, 12.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1519775390625, -11.780517578125, -11.4090576171875, -11.03759765625, -10.6661376953125, -10.294677734375, -9.9232177734375, -9.5517578125, -9.1802978515625, -8.808837890625, -8.4373779296875, -8.06591796875, -7.6944580078125, -7.322998046875, -6.9515380859375, -6.580078125, -6.2086181640625, -5.837158203125, -5.4656982421875, -5.09423828125, -4.7227783203125, -4.351318359375, -3.9798583984375, -3.6083984375, -3.2369384765625, -2.865478515625, -2.4940185546875, -2.12255859375, -1.7510986328125, -1.379638671875, -1.0081787109375, -0.63671875, -0.2652587890625, 0.106201171875, 0.4776611328125, 0.84912109375, 1.2205810546875, 1.592041015625, 1.9635009765625, 2.3349609375, 2.7064208984375, 3.077880859375, 3.4493408203125, 3.82080078125, 4.1922607421875, 4.563720703125, 4.9351806640625, 5.306640625, 5.6781005859375, 6.049560546875, 6.4210205078125, 6.79248046875, 7.1639404296875, 7.535400390625, 7.9068603515625, 8.2783203125, 8.6497802734375, 9.021240234375, 9.3927001953125, 9.76416015625, 10.1356201171875, 10.507080078125, 10.8785400390625, 11.25]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 8.0, 6.0, 21.0, 14.0, 21.0, 19.0, 23.0, 28.0, 42.0, 41.0, 63.0, 69.0, 57.0, 57.0, 68.0, 56.0, 54.0, 46.0, 52.0, 48.0, 46.0, 34.0, 23.0, 24.0, 14.0, 11.0, 15.0, 7.0, 7.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4765625, -11.1708984375, -10.865234375, -10.5595703125, -10.25390625, -9.9482421875, -9.642578125, -9.3369140625, -9.03125, -8.7255859375, -8.419921875, -8.1142578125, -7.80859375, -7.5029296875, -7.197265625, -6.8916015625, -6.5859375, -6.2802734375, -5.974609375, -5.6689453125, -5.36328125, -5.0576171875, -4.751953125, -4.4462890625, -4.140625, -3.8349609375, -3.529296875, -3.2236328125, -2.91796875, -2.6123046875, -2.306640625, -2.0009765625, -1.6953125, -1.3896484375, -1.083984375, -0.7783203125, -0.47265625, -0.1669921875, 0.138671875, 0.4443359375, 0.75, 1.0556640625, 1.361328125, 1.6669921875, 1.97265625, 2.2783203125, 2.583984375, 2.8896484375, 3.1953125, 3.5009765625, 3.806640625, 4.1123046875, 4.41796875, 4.7236328125, 5.029296875, 5.3349609375, 5.640625, 5.9462890625, 6.251953125, 6.5576171875, 6.86328125, 7.1689453125, 7.474609375, 7.7802734375, 8.0859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 7.0, 14.0, 9.0, 23.0, 15.0, 39.0, 78.0, 118.0, 272.0, 636.0, 1613.0, 5837.0, 35926.0, 578901.0, 387689.0, 29707.0, 5147.0, 1418.0, 567.0, 226.0, 138.0, 67.0, 23.0, 33.0, 13.0, 6.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.497222900390625, -1.44366455078125, -1.390106201171875, -1.3365478515625, -1.282989501953125, -1.22943115234375, -1.175872802734375, -1.122314453125, -1.068756103515625, -1.01519775390625, -0.961639404296875, -0.9080810546875, -0.854522705078125, -0.80096435546875, -0.747406005859375, -0.69384765625, -0.640289306640625, -0.58673095703125, -0.533172607421875, -0.4796142578125, -0.426055908203125, -0.37249755859375, -0.318939208984375, -0.265380859375, -0.211822509765625, -0.15826416015625, -0.104705810546875, -0.0511474609375, 0.002410888671875, 0.05596923828125, 0.109527587890625, 0.1630859375, 0.216644287109375, 0.27020263671875, 0.323760986328125, 0.3773193359375, 0.430877685546875, 0.48443603515625, 0.537994384765625, 0.591552734375, 0.645111083984375, 0.69866943359375, 0.752227783203125, 0.8057861328125, 0.859344482421875, 0.91290283203125, 0.966461181640625, 1.02001953125, 1.073577880859375, 1.12713623046875, 1.180694580078125, 1.2342529296875, 1.287811279296875, 1.34136962890625, 1.394927978515625, 1.448486328125, 1.502044677734375, 1.55560302734375, 1.609161376953125, 1.6627197265625, 1.716278076171875, 1.76983642578125, 1.823394775390625, 1.876953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 1.0, 6.0, 8.0, 8.0, 11.0, 10.0, 19.0, 28.0, 35.0, 58.0, 69.0, 85.0, 113.0, 153.0, 97.0, 70.0, 62.0, 34.0, 29.0, 22.0, 24.0, 14.0, 4.0, 6.0, 5.0, 1.0, 5.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001690387725830078, -0.00016345083713531494, -0.00015786290168762207, -0.0001522749662399292, -0.00014668703079223633, -0.00014109909534454346, -0.00013551115989685059, -0.00012992322444915771, -0.00012433528900146484, -0.00011874735355377197, -0.0001131594181060791, -0.00010757148265838623, -0.00010198354721069336, -9.639561176300049e-05, -9.080767631530762e-05, -8.521974086761475e-05, -7.963180541992188e-05, -7.4043869972229e-05, -6.845593452453613e-05, -6.286799907684326e-05, -5.728006362915039e-05, -5.169212818145752e-05, -4.610419273376465e-05, -4.051625728607178e-05, -3.4928321838378906e-05, -2.9340386390686035e-05, -2.3752450942993164e-05, -1.8164515495300293e-05, -1.2576580047607422e-05, -6.988644599914551e-06, -1.4007091522216797e-06, 4.187226295471191e-06, 9.775161743164062e-06, 1.5363097190856934e-05, 2.0951032638549805e-05, 2.6538968086242676e-05, 3.212690353393555e-05, 3.771483898162842e-05, 4.330277442932129e-05, 4.889070987701416e-05, 5.447864532470703e-05, 6.00665807723999e-05, 6.565451622009277e-05, 7.124245166778564e-05, 7.683038711547852e-05, 8.241832256317139e-05, 8.800625801086426e-05, 9.359419345855713e-05, 9.918212890625e-05, 0.00010477006435394287, 0.00011035799980163574, 0.00011594593524932861, 0.00012153387069702148, 0.00012712180614471436, 0.00013270974159240723, 0.0001382976770401001, 0.00014388561248779297, 0.00014947354793548584, 0.0001550614833831787, 0.00016064941883087158, 0.00016623735427856445, 0.00017182528972625732, 0.0001774132251739502, 0.00018300116062164307, 0.00018858909606933594]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 11.0, 8.0, 15.0, 18.0, 32.0, 41.0, 119.0, 200.0, 439.0, 917.0, 2277.0, 6734.0, 27668.0, 169963.0, 711719.0, 101295.0, 18737.0, 4976.0, 1826.0, 752.0, 373.0, 181.0, 111.0, 48.0, 31.0, 21.0, 9.0, 8.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7548828125, -1.7103118896484375, -1.665740966796875, -1.6211700439453125, -1.57659912109375, -1.5320281982421875, -1.487457275390625, -1.4428863525390625, -1.3983154296875, -1.3537445068359375, -1.309173583984375, -1.2646026611328125, -1.22003173828125, -1.1754608154296875, -1.130889892578125, -1.0863189697265625, -1.041748046875, -0.9971771240234375, -0.952606201171875, -0.9080352783203125, -0.86346435546875, -0.8188934326171875, -0.774322509765625, -0.7297515869140625, -0.6851806640625, -0.6406097412109375, -0.596038818359375, -0.5514678955078125, -0.50689697265625, -0.4623260498046875, -0.417755126953125, -0.3731842041015625, -0.32861328125, -0.2840423583984375, -0.239471435546875, -0.1949005126953125, -0.15032958984375, -0.1057586669921875, -0.061187744140625, -0.0166168212890625, 0.0279541015625, 0.0725250244140625, 0.117095947265625, 0.1616668701171875, 0.20623779296875, 0.2508087158203125, 0.295379638671875, 0.3399505615234375, 0.384521484375, 0.4290924072265625, 0.473663330078125, 0.5182342529296875, 0.56280517578125, 0.6073760986328125, 0.651947021484375, 0.6965179443359375, 0.7410888671875, 0.7856597900390625, 0.830230712890625, 0.8748016357421875, 0.91937255859375, 0.9639434814453125, 1.008514404296875, 1.0530853271484375, 1.09765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 1.0, 11.0, 9.0, 12.0, 15.0, 24.0, 22.0, 26.0, 41.0, 51.0, 73.0, 101.0, 147.0, 128.0, 76.0, 49.0, 50.0, 36.0, 24.0, 19.0, 7.0, 12.0, 10.0, 5.0, 7.0, 13.0, 6.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.466796875, -0.44869232177734375, -0.4305877685546875, -0.41248321533203125, -0.394378662109375, -0.37627410888671875, -0.3581695556640625, -0.34006500244140625, -0.32196044921875, -0.30385589599609375, -0.2857513427734375, -0.26764678955078125, -0.249542236328125, -0.23143768310546875, -0.2133331298828125, -0.19522857666015625, -0.1771240234375, -0.15901947021484375, -0.1409149169921875, -0.12281036376953125, -0.104705810546875, -0.08660125732421875, -0.0684967041015625, -0.05039215087890625, -0.03228759765625, -0.01418304443359375, 0.0039215087890625, 0.02202606201171875, 0.040130615234375, 0.05823516845703125, 0.0763397216796875, 0.09444427490234375, 0.112548828125, 0.13065338134765625, 0.1487579345703125, 0.16686248779296875, 0.184967041015625, 0.20307159423828125, 0.2211761474609375, 0.23928070068359375, 0.25738525390625, 0.27548980712890625, 0.2935943603515625, 0.31169891357421875, 0.329803466796875, 0.34790802001953125, 0.3660125732421875, 0.38411712646484375, 0.4022216796875, 0.42032623291015625, 0.4384307861328125, 0.45653533935546875, 0.474639892578125, 0.49274444580078125, 0.5108489990234375, 0.5289535522460938, 0.54705810546875, 0.5651626586914062, 0.5832672119140625, 0.6013717651367188, 0.619476318359375, 0.6375808715820312, 0.6556854248046875, 0.6737899780273438, 0.69189453125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 10.0, 13.0, 30.0, 65.0, 104.0, 166.0, 225.0, 162.0, 102.0, 64.0, 33.0, 14.0, 4.0, 4.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.068559646606445, -7.428589820861816, -6.788619518280029, -6.148649215698242, -5.508679389953613, -4.868709564208984, -4.228739261627197, -3.58876895904541, -2.9487991333007812, -2.3088290691375732, -1.6688590049743652, -1.0288889408111572, -0.3889188766479492, 0.2510511875152588, 0.8910212516784668, 1.530991554260254, 2.170961380004883, 2.810931444168091, 3.450901508331299, 4.090871810913086, 4.730841636657715, 5.370811462402344, 6.010781764984131, 6.650752067565918, 7.290721893310547, 7.930691719055176, 8.570661544799805, 9.21063232421875, 9.850602149963379, 10.490571975708008, 11.130542755126953, 11.770512580871582, 12.410484313964844, 13.050454139709473, 13.690423965454102, 14.330394744873047, 14.970364570617676, 15.610334396362305, 16.25030517578125, 16.890274047851562, 17.530244827270508, 18.170215606689453, 18.810184478759766, 19.45015525817871, 20.090126037597656, 20.73009490966797, 21.370065689086914, 22.01003646850586, 22.650005340576172, 23.289976119995117, 23.92994499206543, 24.569915771484375, 25.209884643554688, 25.849855422973633, 26.489826202392578, 27.12979507446289, 27.769765853881836, 28.40973663330078, 29.049705505371094, 29.68967628479004, 30.329647064208984, 30.969615936279297, 31.609586715698242, 32.24955749511719, 32.8895263671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 5.0, 12.0, 11.0, 19.0, 13.0, 23.0, 29.0, 23.0, 15.0, 26.0, 29.0, 30.0, 31.0, 28.0, 41.0, 32.0, 34.0, 40.0, 35.0, 38.0, 43.0, 51.0, 25.0, 51.0, 27.0, 48.0, 35.0, 33.0, 16.0, 17.0, 23.0, 23.0, 15.0, 16.0, 8.0, 9.0, 8.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.097710609436035, -10.776701927185059, -10.455692291259766, -10.134683609008789, -9.813674926757812, -9.492666244506836, -9.171656608581543, -8.850647926330566, -8.52963924407959, -8.208630561828613, -7.8876214027404785, -7.566612243652344, -7.245603561401367, -6.924594402313232, -6.603585243225098, -6.282576560974121, -5.961567401885986, -5.640558242797852, -5.319549560546875, -4.99854040145874, -4.677531719207764, -4.356522560119629, -4.035513877868652, -3.7145047187805176, -3.393495798110962, -3.0724868774414062, -2.7514779567718506, -2.430469036102295, -2.10945987701416, -1.788451075553894, -1.4674420356750488, -1.1464331150054932, -0.8254241943359375, -0.5044152736663818, -0.1834062933921814, 0.13760268688201904, 0.4586116075515747, 0.7796205282211304, 1.1006295680999756, 1.4216384887695312, 1.742647409439087, 2.0636563301086426, 2.3846652507781982, 2.705674171447754, 3.0266833305358887, 3.3476920127868652, 3.668701171875, 3.9897100925445557, 4.310719013214111, 4.631728172302246, 4.952736854553223, 5.273746013641357, 5.594754695892334, 5.915763854980469, 6.236772537231445, 6.55778169631958, 6.878790855407715, 7.19980001449585, 7.520808696746826, 7.841817855834961, 8.162826538085938, 8.483835220336914, 8.804844856262207, 9.125853538513184, 9.44686222076416]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 0.0, 9.0, 12.0, 10.0, 7.0, 11.0, 28.0, 21.0, 52.0, 40.0, 79.0, 169.0, 327.0, 739.0, 2360.0, 9398.0, 68413.0, 3539895.0, 544538.0, 21809.0, 4085.0, 1244.0, 425.0, 200.0, 128.0, 61.0, 42.0, 35.0, 18.0, 19.0, 27.0, 15.0, 15.0, 13.0, 10.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1953125, -10.819091796875, -10.44287109375, -10.066650390625, -9.6904296875, -9.314208984375, -8.93798828125, -8.561767578125, -8.185546875, -7.809326171875, -7.43310546875, -7.056884765625, -6.6806640625, -6.304443359375, -5.92822265625, -5.552001953125, -5.17578125, -4.799560546875, -4.42333984375, -4.047119140625, -3.6708984375, -3.294677734375, -2.91845703125, -2.542236328125, -2.166015625, -1.789794921875, -1.41357421875, -1.037353515625, -0.6611328125, -0.284912109375, 0.09130859375, 0.467529296875, 0.84375, 1.219970703125, 1.59619140625, 1.972412109375, 2.3486328125, 2.724853515625, 3.10107421875, 3.477294921875, 3.853515625, 4.229736328125, 4.60595703125, 4.982177734375, 5.3583984375, 5.734619140625, 6.11083984375, 6.487060546875, 6.86328125, 7.239501953125, 7.61572265625, 7.991943359375, 8.3681640625, 8.744384765625, 9.12060546875, 9.496826171875, 9.873046875, 10.249267578125, 10.62548828125, 11.001708984375, 11.3779296875, 11.754150390625, 12.13037109375, 12.506591796875, 12.8828125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 1.0, 7.0, 20.0, 20.0, 14.0, 35.0, 41.0, 49.0, 55.0, 89.0, 79.0, 94.0, 99.0, 68.0, 96.0, 57.0, 56.0, 34.0, 33.0, 22.0, 15.0, 11.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.17327880859375, -3.9910888671875, -3.80889892578125, -3.626708984375, -3.44451904296875, -3.2623291015625, -3.08013916015625, -2.89794921875, -2.71575927734375, -2.5335693359375, -2.35137939453125, -2.169189453125, -1.98699951171875, -1.8048095703125, -1.62261962890625, -1.4404296875, -1.25823974609375, -1.0760498046875, -0.89385986328125, -0.711669921875, -0.52947998046875, -0.3472900390625, -0.16510009765625, 0.01708984375, 0.19927978515625, 0.3814697265625, 0.56365966796875, 0.745849609375, 0.92803955078125, 1.1102294921875, 1.29241943359375, 1.474609375, 1.65679931640625, 1.8389892578125, 2.02117919921875, 2.203369140625, 2.38555908203125, 2.5677490234375, 2.74993896484375, 2.93212890625, 3.11431884765625, 3.2965087890625, 3.47869873046875, 3.660888671875, 3.84307861328125, 4.0252685546875, 4.20745849609375, 4.3896484375, 4.57183837890625, 4.7540283203125, 4.93621826171875, 5.118408203125, 5.30059814453125, 5.4827880859375, 5.66497802734375, 5.84716796875, 6.02935791015625, 6.2115478515625, 6.39373779296875, 6.575927734375, 6.75811767578125, 6.9403076171875, 7.12249755859375, 7.3046875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 13.0, 10.0, 17.0, 18.0, 33.0, 44.0, 67.0, 168.0, 334.0, 852.0, 3478.0, 24247.0, 927796.0, 3187272.0, 42934.0, 5043.0, 1139.0, 383.0, 160.0, 87.0, 50.0, 35.0, 26.0, 15.0, 9.0, 10.0, 8.0, 6.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.2890625, -10.9375, -10.5859375, -10.234375, -9.8828125, -9.53125, -9.1796875, -8.828125, -8.4765625, -8.125, -7.7734375, -7.421875, -7.0703125, -6.71875, -6.3671875, -6.015625, -5.6640625, -5.3125, -4.9609375, -4.609375, -4.2578125, -3.90625, -3.5546875, -3.203125, -2.8515625, -2.5, -2.1484375, -1.796875, -1.4453125, -1.09375, -0.7421875, -0.390625, -0.0390625, 0.3125, 0.6640625, 1.015625, 1.3671875, 1.71875, 2.0703125, 2.421875, 2.7734375, 3.125, 3.4765625, 3.828125, 4.1796875, 4.53125, 4.8828125, 5.234375, 5.5859375, 5.9375, 6.2890625, 6.640625, 6.9921875, 7.34375, 7.6953125, 8.046875, 8.3984375, 8.75, 9.1015625, 9.453125, 9.8046875, 10.15625, 10.5078125, 10.859375, 11.2109375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 14.0, 17.0, 26.0, 34.0, 48.0, 55.0, 100.0, 170.0, 256.0, 470.0, 730.0, 822.0, 497.0, 295.0, 147.0, 115.0, 77.0, 49.0, 32.0, 24.0, 18.0, 8.0, 14.0, 11.0, 3.0, 1.0, 9.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.8108062744140625, -1.752471923828125, -1.6941375732421875, -1.63580322265625, -1.5774688720703125, -1.519134521484375, -1.4608001708984375, -1.4024658203125, -1.3441314697265625, -1.285797119140625, -1.2274627685546875, -1.16912841796875, -1.1107940673828125, -1.052459716796875, -0.9941253662109375, -0.935791015625, -0.8774566650390625, -0.819122314453125, -0.7607879638671875, -0.70245361328125, -0.6441192626953125, -0.585784912109375, -0.5274505615234375, -0.4691162109375, -0.4107818603515625, -0.352447509765625, -0.2941131591796875, -0.23577880859375, -0.1774444580078125, -0.119110107421875, -0.0607757568359375, -0.00244140625, 0.0558929443359375, 0.114227294921875, 0.1725616455078125, 0.23089599609375, 0.2892303466796875, 0.347564697265625, 0.4058990478515625, 0.4642333984375, 0.5225677490234375, 0.580902099609375, 0.6392364501953125, 0.69757080078125, 0.7559051513671875, 0.814239501953125, 0.8725738525390625, 0.930908203125, 0.9892425537109375, 1.047576904296875, 1.1059112548828125, 1.16424560546875, 1.2225799560546875, 1.280914306640625, 1.3392486572265625, 1.3975830078125, 1.4559173583984375, 1.514251708984375, 1.5725860595703125, 1.63092041015625, 1.6892547607421875, 1.747589111328125, 1.8059234619140625, 1.8642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 7.0, 12.0, 31.0, 71.0, 152.0, 265.0, 213.0, 158.0, 59.0, 31.0, 14.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1069159507751465, -4.539866924285889, -3.972817897796631, -3.405768871307373, -2.8387198448181152, -2.2716708183288574, -1.7046217918395996, -1.1375727653503418, -0.570523738861084, -0.003474712371826172, 0.5635743141174316, 1.1306233406066895, 1.6976723670959473, 2.264721393585205, 2.831770420074463, 3.3988194465637207, 3.9658684730529785, 4.532917499542236, 5.099966526031494, 5.667015552520752, 6.23406457901001, 6.801113605499268, 7.368162631988525, 7.935211658477783, 8.502260208129883, 9.06930923461914, 9.636358261108398, 10.203407287597656, 10.770456314086914, 11.337505340576172, 11.90455436706543, 12.471603393554688, 13.038652420043945, 13.605701446533203, 14.172750473022461, 14.739799499511719, 15.306848526000977, 15.873897552490234, 16.440946578979492, 17.00799560546875, 17.575044631958008, 18.142093658447266, 18.709142684936523, 19.27619171142578, 19.84324073791504, 20.410289764404297, 20.977338790893555, 21.544387817382812, 22.11143684387207, 22.678485870361328, 23.245534896850586, 23.812583923339844, 24.3796329498291, 24.94668197631836, 25.513731002807617, 26.080780029296875, 26.647829055786133, 27.21487808227539, 27.78192710876465, 28.348976135253906, 28.916025161743164, 29.483074188232422, 30.05012321472168, 30.617172241210938, 31.184221267700195]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 11.0, 15.0, 15.0, 21.0, 31.0, 28.0, 33.0, 26.0, 44.0, 59.0, 67.0, 45.0, 61.0, 64.0, 64.0, 58.0, 57.0, 51.0, 45.0, 37.0, 34.0, 27.0, 25.0, 23.0, 17.0, 14.0, 11.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.30944299697876, -4.143120288848877, -3.976797342300415, -3.810474395751953, -3.6441516876220703, -3.4778289794921875, -3.3115060329437256, -3.1451830863952637, -2.978860378265381, -2.812537670135498, -2.646214723587036, -2.479891777038574, -2.3135690689086914, -2.1472463607788086, -1.9809234142303467, -1.8146005868911743, -1.648277759552002, -1.4819549322128296, -1.3156321048736572, -1.1493092775344849, -0.9829864501953125, -0.8166636228561401, -0.6503407955169678, -0.4840179681777954, -0.31769514083862305, -0.15137231349945068, 0.01495051383972168, 0.18127334117889404, 0.3475961685180664, 0.5139189958572388, 0.6802418231964111, 0.8465646505355835, 1.012887954711914, 1.1792107820510864, 1.3455336093902588, 1.5118564367294312, 1.6781792640686035, 1.8445020914077759, 2.0108249187469482, 2.17714786529541, 2.343470573425293, 2.509793281555176, 2.6761162281036377, 2.8424391746520996, 3.0087618827819824, 3.1750845909118652, 3.341407537460327, 3.507730484008789, 3.674053192138672, 3.8403759002685547, 4.0066986083984375, 4.1730217933654785, 4.339344501495361, 4.505667209625244, 4.671990394592285, 4.838313102722168, 5.004635810852051, 5.170958518981934, 5.337281227111816, 5.503604412078857, 5.66992712020874, 5.836249828338623, 6.002573013305664, 6.168895721435547, 6.33521842956543]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 7.0, 16.0, 14.0, 17.0, 48.0, 51.0, 104.0, 145.0, 299.0, 552.0, 1125.0, 2336.0, 5536.0, 15172.0, 60381.0, 382348.0, 473440.0, 77392.0, 18279.0, 6091.0, 2599.0, 1248.0, 601.0, 315.0, 168.0, 91.0, 54.0, 39.0, 30.0, 14.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.73046875, -1.664093017578125, -1.59771728515625, -1.531341552734375, -1.4649658203125, -1.398590087890625, -1.33221435546875, -1.265838623046875, -1.199462890625, -1.133087158203125, -1.06671142578125, -1.000335693359375, -0.9339599609375, -0.867584228515625, -0.80120849609375, -0.734832763671875, -0.66845703125, -0.602081298828125, -0.53570556640625, -0.469329833984375, -0.4029541015625, -0.336578369140625, -0.27020263671875, -0.203826904296875, -0.137451171875, -0.071075439453125, -0.00469970703125, 0.061676025390625, 0.1280517578125, 0.194427490234375, 0.26080322265625, 0.327178955078125, 0.3935546875, 0.459930419921875, 0.52630615234375, 0.592681884765625, 0.6590576171875, 0.725433349609375, 0.79180908203125, 0.858184814453125, 0.924560546875, 0.990936279296875, 1.05731201171875, 1.123687744140625, 1.1900634765625, 1.256439208984375, 1.32281494140625, 1.389190673828125, 1.45556640625, 1.521942138671875, 1.58831787109375, 1.654693603515625, 1.7210693359375, 1.787445068359375, 1.85382080078125, 1.920196533203125, 1.986572265625, 2.052947998046875, 2.11932373046875, 2.185699462890625, 2.2520751953125, 2.318450927734375, 2.38482666015625, 2.451202392578125, 2.517578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 7.0, 11.0, 9.0, 27.0, 10.0, 29.0, 21.0, 27.0, 28.0, 36.0, 44.0, 38.0, 45.0, 42.0, 47.0, 49.0, 46.0, 53.0, 38.0, 53.0, 46.0, 37.0, 44.0, 26.0, 30.0, 26.0, 23.0, 24.0, 13.0, 12.0, 17.0, 10.0, 8.0, 3.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.74908447265625, -2.6563720703125, -2.56365966796875, -2.470947265625, -2.37823486328125, -2.2855224609375, -2.19281005859375, -2.10009765625, -2.00738525390625, -1.9146728515625, -1.82196044921875, -1.729248046875, -1.63653564453125, -1.5438232421875, -1.45111083984375, -1.3583984375, -1.26568603515625, -1.1729736328125, -1.08026123046875, -0.987548828125, -0.89483642578125, -0.8021240234375, -0.70941162109375, -0.61669921875, -0.52398681640625, -0.4312744140625, -0.33856201171875, -0.245849609375, -0.15313720703125, -0.0604248046875, 0.03228759765625, 0.125, 0.21771240234375, 0.3104248046875, 0.40313720703125, 0.495849609375, 0.58856201171875, 0.6812744140625, 0.77398681640625, 0.86669921875, 0.95941162109375, 1.0521240234375, 1.14483642578125, 1.237548828125, 1.33026123046875, 1.4229736328125, 1.51568603515625, 1.6083984375, 1.70111083984375, 1.7938232421875, 1.88653564453125, 1.979248046875, 2.07196044921875, 2.1646728515625, 2.25738525390625, 2.35009765625, 2.44281005859375, 2.5355224609375, 2.62823486328125, 2.720947265625, 2.81365966796875, 2.9063720703125, 2.99908447265625, 3.091796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 3.0, 14.0, 14.0, 12.0, 23.0, 25.0, 54.0, 86.0, 120.0, 256.0, 468.0, 1028.0, 2283.0, 6130.0, 19711.0, 92958.0, 525844.0, 325907.0, 53407.0, 12681.0, 4174.0, 1669.0, 778.0, 365.0, 206.0, 94.0, 68.0, 48.0, 35.0, 22.0, 19.0, 16.0, 7.0, 8.0, 2.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8447265625, -1.788543701171875, -1.73236083984375, -1.676177978515625, -1.6199951171875, -1.563812255859375, -1.50762939453125, -1.451446533203125, -1.395263671875, -1.339080810546875, -1.28289794921875, -1.226715087890625, -1.1705322265625, -1.114349365234375, -1.05816650390625, -1.001983642578125, -0.94580078125, -0.889617919921875, -0.83343505859375, -0.777252197265625, -0.7210693359375, -0.664886474609375, -0.60870361328125, -0.552520751953125, -0.496337890625, -0.440155029296875, -0.38397216796875, -0.327789306640625, -0.2716064453125, -0.215423583984375, -0.15924072265625, -0.103057861328125, -0.046875, 0.009307861328125, 0.06549072265625, 0.121673583984375, 0.1778564453125, 0.234039306640625, 0.29022216796875, 0.346405029296875, 0.402587890625, 0.458770751953125, 0.51495361328125, 0.571136474609375, 0.6273193359375, 0.683502197265625, 0.73968505859375, 0.795867919921875, 0.85205078125, 0.908233642578125, 0.96441650390625, 1.020599365234375, 1.0767822265625, 1.132965087890625, 1.18914794921875, 1.245330810546875, 1.301513671875, 1.357696533203125, 1.41387939453125, 1.470062255859375, 1.5262451171875, 1.582427978515625, 1.63861083984375, 1.694793701171875, 1.7509765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 1.0, 11.0, 11.0, 10.0, 17.0, 16.0, 16.0, 22.0, 20.0, 23.0, 23.0, 42.0, 35.0, 29.0, 43.0, 39.0, 40.0, 51.0, 47.0, 45.0, 43.0, 33.0, 36.0, 32.0, 27.0, 35.0, 36.0, 41.0, 29.0, 18.0, 22.0, 12.0, 15.0, 20.0, 13.0, 9.0, 5.0, 4.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.83203125, -5.65875244140625, -5.4854736328125, -5.31219482421875, -5.138916015625, -4.96563720703125, -4.7923583984375, -4.61907958984375, -4.44580078125, -4.27252197265625, -4.0992431640625, -3.92596435546875, -3.752685546875, -3.57940673828125, -3.4061279296875, -3.23284912109375, -3.0595703125, -2.88629150390625, -2.7130126953125, -2.53973388671875, -2.366455078125, -2.19317626953125, -2.0198974609375, -1.84661865234375, -1.67333984375, -1.50006103515625, -1.3267822265625, -1.15350341796875, -0.980224609375, -0.80694580078125, -0.6336669921875, -0.46038818359375, -0.287109375, -0.11383056640625, 0.0594482421875, 0.23272705078125, 0.406005859375, 0.57928466796875, 0.7525634765625, 0.92584228515625, 1.09912109375, 1.27239990234375, 1.4456787109375, 1.61895751953125, 1.792236328125, 1.96551513671875, 2.1387939453125, 2.31207275390625, 2.4853515625, 2.65863037109375, 2.8319091796875, 3.00518798828125, 3.178466796875, 3.35174560546875, 3.5250244140625, 3.69830322265625, 3.87158203125, 4.04486083984375, 4.2181396484375, 4.39141845703125, 4.564697265625, 4.73797607421875, 4.9112548828125, 5.08453369140625, 5.2578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 12.0, 16.0, 15.0, 23.0, 32.0, 56.0, 84.0, 133.0, 222.0, 421.0, 722.0, 1475.0, 3831.0, 12283.0, 78021.0, 712814.0, 207021.0, 21939.0, 5477.0, 2002.0, 863.0, 437.0, 264.0, 127.0, 82.0, 45.0, 40.0, 16.0, 23.0, 14.0, 3.0, 5.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8184585571289062, -0.7877960205078125, -0.7571334838867188, -0.726470947265625, -0.6958084106445312, -0.6651458740234375, -0.6344833374023438, -0.60382080078125, -0.5731582641601562, -0.5424957275390625, -0.5118331909179688, -0.481170654296875, -0.45050811767578125, -0.4198455810546875, -0.38918304443359375, -0.3585205078125, -0.32785797119140625, -0.2971954345703125, -0.26653289794921875, -0.235870361328125, -0.20520782470703125, -0.1745452880859375, -0.14388275146484375, -0.11322021484375, -0.08255767822265625, -0.0518951416015625, -0.02123260498046875, 0.009429931640625, 0.04009246826171875, 0.0707550048828125, 0.10141754150390625, 0.132080078125, 0.16274261474609375, 0.1934051513671875, 0.22406768798828125, 0.254730224609375, 0.28539276123046875, 0.3160552978515625, 0.34671783447265625, 0.37738037109375, 0.40804290771484375, 0.4387054443359375, 0.46936798095703125, 0.500030517578125, 0.5306930541992188, 0.5613555908203125, 0.5920181274414062, 0.6226806640625, 0.6533432006835938, 0.6840057373046875, 0.7146682739257812, 0.745330810546875, 0.7759933471679688, 0.8066558837890625, 0.8373184204101562, 0.86798095703125, 0.8986434936523438, 0.9293060302734375, 0.9599685668945312, 0.990631103515625, 1.0212936401367188, 1.0519561767578125, 1.0826187133789062, 1.11328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 5.0, 8.0, 16.0, 19.0, 29.0, 54.0, 50.0, 116.0, 159.0, 157.0, 135.0, 78.0, 56.0, 39.0, 22.0, 13.0, 14.0, 6.0, 4.0, 8.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004048347473144531, -0.00039149075746536255, -0.00037814676761627197, -0.0003648027777671814, -0.0003514587879180908, -0.00033811479806900024, -0.00032477080821990967, -0.0003114268183708191, -0.0002980828285217285, -0.00028473883867263794, -0.00027139484882354736, -0.0002580508589744568, -0.0002447068691253662, -0.00023136287927627563, -0.00021801888942718506, -0.00020467489957809448, -0.0001913309097290039, -0.00017798691987991333, -0.00016464293003082275, -0.00015129894018173218, -0.0001379549503326416, -0.00012461096048355103, -0.00011126697063446045, -9.792298078536987e-05, -8.45789909362793e-05, -7.123500108718872e-05, -5.7891011238098145e-05, -4.454702138900757e-05, -3.120303153991699e-05, -1.7859041690826416e-05, -4.51505184173584e-06, 8.828938007354736e-06, 2.2172927856445312e-05, 3.551691770553589e-05, 4.8860907554626465e-05, 6.220489740371704e-05, 7.554888725280762e-05, 8.88928771018982e-05, 0.00010223686695098877, 0.00011558085680007935, 0.00012892484664916992, 0.0001422688364982605, 0.00015561282634735107, 0.00016895681619644165, 0.00018230080604553223, 0.0001956447958946228, 0.00020898878574371338, 0.00022233277559280396, 0.00023567676544189453, 0.0002490207552909851, 0.0002623647451400757, 0.00027570873498916626, 0.00028905272483825684, 0.0003023967146873474, 0.000315740704536438, 0.00032908469438552856, 0.00034242868423461914, 0.0003557726740837097, 0.0003691166639328003, 0.00038246065378189087, 0.00039580464363098145, 0.000409148633480072, 0.0004224926233291626, 0.0004358366131782532, 0.00044918060302734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 4.0, 5.0, 13.0, 20.0, 28.0, 63.0, 72.0, 126.0, 221.0, 416.0, 873.0, 1783.0, 4962.0, 19568.0, 205694.0, 738420.0, 60793.0, 9824.0, 3003.0, 1261.0, 610.0, 311.0, 194.0, 99.0, 66.0, 29.0, 31.0, 17.0, 8.0, 4.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3876953125, -1.3472137451171875, -1.306732177734375, -1.2662506103515625, -1.22576904296875, -1.1852874755859375, -1.144805908203125, -1.1043243408203125, -1.0638427734375, -1.0233612060546875, -0.982879638671875, -0.9423980712890625, -0.90191650390625, -0.8614349365234375, -0.820953369140625, -0.7804718017578125, -0.739990234375, -0.6995086669921875, -0.659027099609375, -0.6185455322265625, -0.57806396484375, -0.5375823974609375, -0.497100830078125, -0.4566192626953125, -0.4161376953125, -0.3756561279296875, -0.335174560546875, -0.2946929931640625, -0.25421142578125, -0.2137298583984375, -0.173248291015625, -0.1327667236328125, -0.09228515625, -0.0518035888671875, -0.011322021484375, 0.0291595458984375, 0.06964111328125, 0.1101226806640625, 0.150604248046875, 0.1910858154296875, 0.2315673828125, 0.2720489501953125, 0.312530517578125, 0.3530120849609375, 0.39349365234375, 0.4339752197265625, 0.474456787109375, 0.5149383544921875, 0.555419921875, 0.5959014892578125, 0.636383056640625, 0.6768646240234375, 0.71734619140625, 0.7578277587890625, 0.798309326171875, 0.8387908935546875, 0.8792724609375, 0.9197540283203125, 0.960235595703125, 1.0007171630859375, 1.04119873046875, 1.0816802978515625, 1.122161865234375, 1.1626434326171875, 1.203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 4.0, 12.0, 7.0, 15.0, 23.0, 26.0, 47.0, 74.0, 79.0, 152.0, 161.0, 125.0, 72.0, 54.0, 51.0, 23.0, 8.0, 16.0, 10.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358642578125, -0.3481559753417969, -0.33766937255859375, -0.3271827697753906, -0.3166961669921875, -0.3062095642089844, -0.29572296142578125, -0.2852363586425781, -0.274749755859375, -0.2642631530761719, -0.25377655029296875, -0.24328994750976562, -0.2328033447265625, -0.22231674194335938, -0.21183013916015625, -0.20134353637695312, -0.19085693359375, -0.18037033081054688, -0.16988372802734375, -0.15939712524414062, -0.1489105224609375, -0.13842391967773438, -0.12793731689453125, -0.11745071411132812, -0.106964111328125, -0.09647750854492188, -0.08599090576171875, -0.07550430297851562, -0.0650177001953125, -0.054531097412109375, -0.04404449462890625, -0.033557891845703125, -0.0230712890625, -0.012584686279296875, -0.00209808349609375, 0.008388519287109375, 0.0188751220703125, 0.029361724853515625, 0.03984832763671875, 0.050334930419921875, 0.060821533203125, 0.07130813598632812, 0.08179473876953125, 0.09228134155273438, 0.1027679443359375, 0.11325454711914062, 0.12374114990234375, 0.13422775268554688, 0.14471435546875, 0.15520095825195312, 0.16568756103515625, 0.17617416381835938, 0.1866607666015625, 0.19714736938476562, 0.20763397216796875, 0.21812057495117188, 0.228607177734375, 0.23909378051757812, 0.24958038330078125, 0.2600669860839844, 0.2705535888671875, 0.2810401916503906, 0.29152679443359375, 0.3020133972167969, 0.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 10.0, 19.0, 37.0, 78.0, 118.0, 207.0, 183.0, 148.0, 97.0, 51.0, 35.0, 13.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6614701747894287, -3.362987995147705, -3.0645058155059814, -2.766023635864258, -2.4675416946411133, -2.1690592765808105, -1.870577335357666, -1.5720951557159424, -1.2736129760742188, -0.9751307964324951, -0.6766486763954163, -0.3781665563583374, -0.07968437671661377, 0.21879780292510986, 0.517279863357544, 0.8157620429992676, 1.1142442226409912, 1.4127264022827148, 1.7112085819244385, 2.009690761566162, 2.3081727027893066, 2.6066551208496094, 2.905137062072754, 3.2036192417144775, 3.502101421356201, 3.800583600997925, 4.099065780639648, 4.397547721862793, 4.696030139923096, 4.99451208114624, 5.292994499206543, 5.5914764404296875, 5.889959335327148, 6.188441276550293, 6.486923694610596, 6.78540563583374, 7.083888053894043, 7.3823699951171875, 7.680851936340332, 7.979334354400635, 8.277816772460938, 8.576298713684082, 8.874780654907227, 9.173263549804688, 9.471745491027832, 9.770227432250977, 10.068709373474121, 10.367191314697266, 10.665674209594727, 10.964156150817871, 11.262638092041016, 11.561120986938477, 11.859602928161621, 12.158084869384766, 12.45656681060791, 12.755048751831055, 13.0535306930542, 13.352012634277344, 13.650494575500488, 13.94897747039795, 14.247459411621094, 14.545941352844238, 14.844423294067383, 15.142906188964844, 15.441388130187988]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 8.0, 10.0, 10.0, 16.0, 27.0, 31.0, 21.0, 33.0, 44.0, 39.0, 53.0, 60.0, 63.0, 58.0, 64.0, 61.0, 54.0, 40.0, 51.0, 40.0, 49.0, 43.0, 31.0, 19.0, 19.0, 17.0, 9.0, 7.0, 6.0, 9.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.212761878967285, -3.0995283126831055, -2.986294746398926, -2.873061180114746, -2.7598276138305664, -2.6465940475463867, -2.533360481262207, -2.4201269149780273, -2.3068933486938477, -2.193659782409668, -2.0804262161254883, -1.9671926498413086, -1.853959083557129, -1.7407255172729492, -1.6274919509887695, -1.5142583847045898, -1.4010248184204102, -1.2877912521362305, -1.1745576858520508, -1.061324119567871, -0.9480905532836914, -0.8348569869995117, -0.721623420715332, -0.6083898544311523, -0.49515628814697266, -0.38192272186279297, -0.2686891555786133, -0.1554555892944336, -0.042222023010253906, 0.07101154327392578, 0.18424510955810547, 0.29747867584228516, 0.41071224212646484, 0.5239458084106445, 0.6371793746948242, 0.7504129409790039, 0.8636465072631836, 0.9768800735473633, 1.090113639831543, 1.2033472061157227, 1.3165807723999023, 1.429814338684082, 1.5430479049682617, 1.6562814712524414, 1.769515037536621, 1.8827486038208008, 1.9959821701049805, 2.10921573638916, 2.22244930267334, 2.3356828689575195, 2.448916435241699, 2.562150001525879, 2.6753835678100586, 2.7886171340942383, 2.901850700378418, 3.0150842666625977, 3.1283178329467773, 3.241551399230957, 3.3547849655151367, 3.4680185317993164, 3.581252098083496, 3.694485664367676, 3.8077192306518555, 3.920952796936035, 4.034186363220215]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 14.0, 16.0, 25.0, 50.0, 57.0, 118.0, 176.0, 326.0, 548.0, 972.0, 2039.0, 4121.0, 9805.0, 27851.0, 107261.0, 630072.0, 198398.0, 41998.0, 13746.0, 5504.0, 2586.0, 1276.0, 673.0, 376.0, 190.0, 117.0, 90.0, 45.0, 31.0, 26.0, 13.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.140289306640625, -3.01300048828125, -2.885711669921875, -2.7584228515625, -2.631134033203125, -2.50384521484375, -2.376556396484375, -2.249267578125, -2.121978759765625, -1.99468994140625, -1.867401123046875, -1.7401123046875, -1.612823486328125, -1.48553466796875, -1.358245849609375, -1.23095703125, -1.103668212890625, -0.97637939453125, -0.849090576171875, -0.7218017578125, -0.594512939453125, -0.46722412109375, -0.339935302734375, -0.212646484375, -0.085357666015625, 0.04193115234375, 0.169219970703125, 0.2965087890625, 0.423797607421875, 0.55108642578125, 0.678375244140625, 0.8056640625, 0.932952880859375, 1.06024169921875, 1.187530517578125, 1.3148193359375, 1.442108154296875, 1.56939697265625, 1.696685791015625, 1.823974609375, 1.951263427734375, 2.07855224609375, 2.205841064453125, 2.3331298828125, 2.460418701171875, 2.58770751953125, 2.714996337890625, 2.84228515625, 2.969573974609375, 3.09686279296875, 3.224151611328125, 3.3514404296875, 3.478729248046875, 3.60601806640625, 3.733306884765625, 3.860595703125, 3.987884521484375, 4.11517333984375, 4.242462158203125, 4.3697509765625, 4.497039794921875, 4.62432861328125, 4.751617431640625, 4.87890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 9.0, 7.0, 6.0, 13.0, 12.0, 24.0, 13.0, 15.0, 27.0, 29.0, 28.0, 39.0, 40.0, 52.0, 52.0, 46.0, 66.0, 39.0, 64.0, 45.0, 49.0, 38.0, 41.0, 35.0, 39.0, 31.0, 37.0, 21.0, 19.0, 13.0, 11.0, 9.0, 6.0, 7.0, 6.0, 4.0, 10.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12890625, -4.94940185546875, -4.7698974609375, -4.59039306640625, -4.410888671875, -4.23138427734375, -4.0518798828125, -3.87237548828125, -3.69287109375, -3.51336669921875, -3.3338623046875, -3.15435791015625, -2.974853515625, -2.79534912109375, -2.6158447265625, -2.43634033203125, -2.2568359375, -2.07733154296875, -1.8978271484375, -1.71832275390625, -1.538818359375, -1.35931396484375, -1.1798095703125, -1.00030517578125, -0.82080078125, -0.64129638671875, -0.4617919921875, -0.28228759765625, -0.102783203125, 0.07672119140625, 0.2562255859375, 0.43572998046875, 0.615234375, 0.79473876953125, 0.9742431640625, 1.15374755859375, 1.333251953125, 1.51275634765625, 1.6922607421875, 1.87176513671875, 2.05126953125, 2.23077392578125, 2.4102783203125, 2.58978271484375, 2.769287109375, 2.94879150390625, 3.1282958984375, 3.30780029296875, 3.4873046875, 3.66680908203125, 3.8463134765625, 4.02581787109375, 4.205322265625, 4.38482666015625, 4.5643310546875, 4.74383544921875, 4.92333984375, 5.10284423828125, 5.2823486328125, 5.46185302734375, 5.641357421875, 5.82086181640625, 6.0003662109375, 6.17987060546875, 6.359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 11.0, 5.0, 6.0, 8.0, 10.0, 11.0, 17.0, 26.0, 24.0, 41.0, 54.0, 74.0, 106.0, 150.0, 271.0, 530.0, 1887.0, 9229.0, 126679.0, 863685.0, 38547.0, 4792.0, 1188.0, 454.0, 214.0, 131.0, 94.0, 62.0, 61.0, 41.0, 33.0, 19.0, 23.0, 15.0, 14.0, 10.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.0234375, -8.7525634765625, -8.481689453125, -8.2108154296875, -7.93994140625, -7.6690673828125, -7.398193359375, -7.1273193359375, -6.8564453125, -6.5855712890625, -6.314697265625, -6.0438232421875, -5.77294921875, -5.5020751953125, -5.231201171875, -4.9603271484375, -4.689453125, -4.4185791015625, -4.147705078125, -3.8768310546875, -3.60595703125, -3.3350830078125, -3.064208984375, -2.7933349609375, -2.5224609375, -2.2515869140625, -1.980712890625, -1.7098388671875, -1.43896484375, -1.1680908203125, -0.897216796875, -0.6263427734375, -0.35546875, -0.0845947265625, 0.186279296875, 0.4571533203125, 0.72802734375, 0.9989013671875, 1.269775390625, 1.5406494140625, 1.8115234375, 2.0823974609375, 2.353271484375, 2.6241455078125, 2.89501953125, 3.1658935546875, 3.436767578125, 3.7076416015625, 3.978515625, 4.2493896484375, 4.520263671875, 4.7911376953125, 5.06201171875, 5.3328857421875, 5.603759765625, 5.8746337890625, 6.1455078125, 6.4163818359375, 6.687255859375, 6.9581298828125, 7.22900390625, 7.4998779296875, 7.770751953125, 8.0416259765625, 8.3125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 2.0, 11.0, 12.0, 16.0, 17.0, 18.0, 16.0, 27.0, 24.0, 26.0, 38.0, 39.0, 42.0, 43.0, 53.0, 44.0, 52.0, 59.0, 58.0, 49.0, 45.0, 38.0, 31.0, 36.0, 28.0, 24.0, 29.0, 21.0, 15.0, 19.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.77734375, -7.5662841796875, -7.355224609375, -7.1441650390625, -6.93310546875, -6.7220458984375, -6.510986328125, -6.2999267578125, -6.0888671875, -5.8778076171875, -5.666748046875, -5.4556884765625, -5.24462890625, -5.0335693359375, -4.822509765625, -4.6114501953125, -4.400390625, -4.1893310546875, -3.978271484375, -3.7672119140625, -3.55615234375, -3.3450927734375, -3.134033203125, -2.9229736328125, -2.7119140625, -2.5008544921875, -2.289794921875, -2.0787353515625, -1.86767578125, -1.6566162109375, -1.445556640625, -1.2344970703125, -1.0234375, -0.8123779296875, -0.601318359375, -0.3902587890625, -0.17919921875, 0.0318603515625, 0.242919921875, 0.4539794921875, 0.6650390625, 0.8760986328125, 1.087158203125, 1.2982177734375, 1.50927734375, 1.7203369140625, 1.931396484375, 2.1424560546875, 2.353515625, 2.5645751953125, 2.775634765625, 2.9866943359375, 3.19775390625, 3.4088134765625, 3.619873046875, 3.8309326171875, 4.0419921875, 4.2530517578125, 4.464111328125, 4.6751708984375, 4.88623046875, 5.0972900390625, 5.308349609375, 5.5194091796875, 5.73046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 4.0, 4.0, 7.0, 9.0, 9.0, 23.0, 30.0, 73.0, 157.0, 345.0, 1085.0, 4884.0, 43713.0, 837706.0, 146643.0, 11032.0, 1905.0, 483.0, 177.0, 109.0, 49.0, 26.0, 22.0, 17.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.09375, -2.0277099609375, -1.961669921875, -1.8956298828125, -1.82958984375, -1.7635498046875, -1.697509765625, -1.6314697265625, -1.5654296875, -1.4993896484375, -1.433349609375, -1.3673095703125, -1.30126953125, -1.2352294921875, -1.169189453125, -1.1031494140625, -1.037109375, -0.9710693359375, -0.905029296875, -0.8389892578125, -0.77294921875, -0.7069091796875, -0.640869140625, -0.5748291015625, -0.5087890625, -0.4427490234375, -0.376708984375, -0.3106689453125, -0.24462890625, -0.1785888671875, -0.112548828125, -0.0465087890625, 0.01953125, 0.0855712890625, 0.151611328125, 0.2176513671875, 0.28369140625, 0.3497314453125, 0.415771484375, 0.4818115234375, 0.5478515625, 0.6138916015625, 0.679931640625, 0.7459716796875, 0.81201171875, 0.8780517578125, 0.944091796875, 1.0101318359375, 1.076171875, 1.1422119140625, 1.208251953125, 1.2742919921875, 1.34033203125, 1.4063720703125, 1.472412109375, 1.5384521484375, 1.6044921875, 1.6705322265625, 1.736572265625, 1.8026123046875, 1.86865234375, 1.9346923828125, 2.000732421875, 2.0667724609375, 2.1328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 10.0, 13.0, 7.0, 14.0, 18.0, 25.0, 48.0, 71.0, 90.0, 118.0, 154.0, 107.0, 82.0, 56.0, 51.0, 35.0, 25.0, 13.0, 7.0, 9.0, 3.0, 7.0, 4.0, 3.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021648406982421875, -0.000210542231798172, -0.00020460039377212524, -0.0001986585557460785, -0.00019271671772003174, -0.00018677487969398499, -0.00018083304166793823, -0.00017489120364189148, -0.00016894936561584473, -0.00016300752758979797, -0.00015706568956375122, -0.00015112385153770447, -0.00014518201351165771, -0.00013924017548561096, -0.0001332983374595642, -0.00012735649943351746, -0.0001214146614074707, -0.00011547282338142395, -0.0001095309853553772, -0.00010358914732933044, -9.764730930328369e-05, -9.170547127723694e-05, -8.576363325119019e-05, -7.982179522514343e-05, -7.387995719909668e-05, -6.793811917304993e-05, -6.199628114700317e-05, -5.605444312095642e-05, -5.011260509490967e-05, -4.4170767068862915e-05, -3.822892904281616e-05, -3.228709101676941e-05, -2.6345252990722656e-05, -2.0403414964675903e-05, -1.446157693862915e-05, -8.519738912582397e-06, -2.5779008865356445e-06, 3.3639371395111084e-06, 9.305775165557861e-06, 1.5247613191604614e-05, 2.1189451217651367e-05, 2.713128924369812e-05, 3.307312726974487e-05, 3.9014965295791626e-05, 4.495680332183838e-05, 5.089864134788513e-05, 5.6840479373931885e-05, 6.278231739997864e-05, 6.872415542602539e-05, 7.466599345207214e-05, 8.06078314781189e-05, 8.654966950416565e-05, 9.24915075302124e-05, 9.843334555625916e-05, 0.00010437518358230591, 0.00011031702160835266, 0.00011625885963439941, 0.00012220069766044617, 0.00012814253568649292, 0.00013408437371253967, 0.00014002621173858643, 0.00014596804976463318, 0.00015190988779067993, 0.00015785172581672668, 0.00016379356384277344]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 12.0, 11.0, 22.0, 40.0, 64.0, 130.0, 276.0, 602.0, 1564.0, 5575.0, 37345.0, 701559.0, 275838.0, 19770.0, 3685.0, 1136.0, 487.0, 206.0, 90.0, 44.0, 26.0, 20.0, 12.0, 4.0, 7.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3279266357421875, -1.264251708984375, -1.2005767822265625, -1.13690185546875, -1.0732269287109375, -1.009552001953125, -0.9458770751953125, -0.8822021484375, -0.8185272216796875, -0.754852294921875, -0.6911773681640625, -0.62750244140625, -0.5638275146484375, -0.500152587890625, -0.4364776611328125, -0.372802734375, -0.3091278076171875, -0.245452880859375, -0.1817779541015625, -0.11810302734375, -0.0544281005859375, 0.009246826171875, 0.0729217529296875, 0.1365966796875, 0.2002716064453125, 0.263946533203125, 0.3276214599609375, 0.39129638671875, 0.4549713134765625, 0.518646240234375, 0.5823211669921875, 0.64599609375, 0.7096710205078125, 0.773345947265625, 0.8370208740234375, 0.90069580078125, 0.9643707275390625, 1.028045654296875, 1.0917205810546875, 1.1553955078125, 1.2190704345703125, 1.282745361328125, 1.3464202880859375, 1.41009521484375, 1.4737701416015625, 1.537445068359375, 1.6011199951171875, 1.664794921875, 1.7284698486328125, 1.792144775390625, 1.8558197021484375, 1.91949462890625, 1.9831695556640625, 2.046844482421875, 2.1105194091796875, 2.1741943359375, 2.2378692626953125, 2.301544189453125, 2.3652191162109375, 2.42889404296875, 2.4925689697265625, 2.556243896484375, 2.6199188232421875, 2.68359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 2.0, 14.0, 12.0, 13.0, 14.0, 32.0, 36.0, 48.0, 64.0, 98.0, 160.0, 145.0, 83.0, 78.0, 61.0, 43.0, 13.0, 14.0, 17.0, 11.0, 5.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74609375, -0.725372314453125, -0.70465087890625, -0.683929443359375, -0.6632080078125, -0.642486572265625, -0.62176513671875, -0.601043701171875, -0.580322265625, -0.559600830078125, -0.53887939453125, -0.518157958984375, -0.4974365234375, -0.476715087890625, -0.45599365234375, -0.435272216796875, -0.41455078125, -0.393829345703125, -0.37310791015625, -0.352386474609375, -0.3316650390625, -0.310943603515625, -0.29022216796875, -0.269500732421875, -0.248779296875, -0.228057861328125, -0.20733642578125, -0.186614990234375, -0.1658935546875, -0.145172119140625, -0.12445068359375, -0.103729248046875, -0.0830078125, -0.062286376953125, -0.04156494140625, -0.020843505859375, -0.0001220703125, 0.020599365234375, 0.04132080078125, 0.062042236328125, 0.082763671875, 0.103485107421875, 0.12420654296875, 0.144927978515625, 0.1656494140625, 0.186370849609375, 0.20709228515625, 0.227813720703125, 0.24853515625, 0.269256591796875, 0.28997802734375, 0.310699462890625, 0.3314208984375, 0.352142333984375, 0.37286376953125, 0.393585205078125, 0.414306640625, 0.435028076171875, 0.45574951171875, 0.476470947265625, 0.4971923828125, 0.517913818359375, 0.53863525390625, 0.559356689453125, 0.580078125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 28.0, 35.0, 112.0, 162.0, 196.0, 177.0, 132.0, 77.0, 40.0, 17.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.770491600036621, -11.17680835723877, -10.583126068115234, -9.989442825317383, -9.395759582519531, -8.80207633972168, -8.208393096923828, -7.614710807800293, -7.021027565002441, -6.42734432220459, -5.8336615562438965, -5.239978790283203, -4.646295547485352, -4.0526123046875, -3.4589295387268066, -2.8652467727661133, -2.2715635299682617, -1.6778805255889893, -1.0841975212097168, -0.49051451683044434, 0.10316848754882812, 0.6968514919281006, 1.290534496307373, 1.8842172622680664, 2.477900505065918, 3.0715835094451904, 3.665266513824463, 4.258949279785156, 4.852632522583008, 5.446315765380859, 6.039998531341553, 6.633681297302246, 7.227365493774414, 7.821048736572266, 8.414731979370117, 9.008414268493652, 9.602097511291504, 10.195780754089355, 10.78946304321289, 11.383146286010742, 11.976829528808594, 12.570512771606445, 13.164196014404297, 13.757878303527832, 14.351561546325684, 14.945244789123535, 15.53892707824707, 16.132610321044922, 16.726293563842773, 17.319976806640625, 17.913660049438477, 18.507343292236328, 19.101024627685547, 19.6947078704834, 20.28839111328125, 20.8820743560791, 21.475757598876953, 22.069440841674805, 22.663124084472656, 23.256807327270508, 23.85049057006836, 24.444171905517578, 25.03785514831543, 25.63153839111328, 26.225221633911133]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 10.0, 6.0, 7.0, 9.0, 13.0, 18.0, 12.0, 15.0, 20.0, 23.0, 26.0, 26.0, 25.0, 24.0, 26.0, 33.0, 35.0, 28.0, 37.0, 36.0, 40.0, 37.0, 44.0, 42.0, 37.0, 29.0, 45.0, 27.0, 37.0, 36.0, 33.0, 16.0, 24.0, 17.0, 19.0, 16.0, 11.0, 7.0, 12.0, 12.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.163599967956543, -8.86579704284668, -8.567995071411133, -8.27019214630127, -7.972389221191406, -7.674586772918701, -7.376784324645996, -7.078981399536133, -6.781178951263428, -6.483376502990723, -6.185573577880859, -5.887771129608154, -5.589968681335449, -5.292165756225586, -4.994363307952881, -4.696560859680176, -4.3987579345703125, -4.100955486297607, -3.803152561187744, -3.505350112915039, -3.207547426223755, -2.9097447395324707, -2.6119422912597656, -2.3141396045684814, -2.0163369178771973, -1.718534231185913, -1.4207316637039185, -1.1229290962219238, -0.8251264095306396, -0.5273237228393555, -0.22952115535736084, 0.06828141212463379, 0.36608409881591797, 0.6638867259025574, 0.9616893529891968, 1.2594919204711914, 1.5572946071624756, 1.8550972938537598, 2.152899742126465, 2.450702428817749, 2.748505115509033, 3.0463078022003174, 3.3441104888916016, 3.6419129371643066, 3.939715623855591, 4.237518310546875, 4.53532075881958, 4.833123207092285, 5.130926132202148, 5.4287285804748535, 5.726531505584717, 6.024333953857422, 6.322136878967285, 6.61993932723999, 6.917741775512695, 7.215544700622559, 7.513347148895264, 7.811149597167969, 8.108952522277832, 8.406755447387695, 8.704557418823242, 9.002360343933105, 9.300163269042969, 9.597965240478516, 9.895768165588379]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 3.0, 10.0, 11.0, 9.0, 18.0, 26.0, 45.0, 49.0, 59.0, 78.0, 103.0, 150.0, 187.0, 283.0, 463.0, 815.0, 1643.0, 4532.0, 17460.0, 160075.0, 3535865.0, 434870.0, 26862.0, 5877.0, 2200.0, 933.0, 496.0, 334.0, 217.0, 150.0, 113.0, 82.0, 62.0, 58.0, 33.0, 41.0, 18.0, 17.0, 12.0, 11.0, 3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.4129638671875, -7.154052734375, -6.8951416015625, -6.63623046875, -6.3773193359375, -6.118408203125, -5.8594970703125, -5.6005859375, -5.3416748046875, -5.082763671875, -4.8238525390625, -4.56494140625, -4.3060302734375, -4.047119140625, -3.7882080078125, -3.529296875, -3.2703857421875, -3.011474609375, -2.7525634765625, -2.49365234375, -2.2347412109375, -1.975830078125, -1.7169189453125, -1.4580078125, -1.1990966796875, -0.940185546875, -0.6812744140625, -0.42236328125, -0.1634521484375, 0.095458984375, 0.3543701171875, 0.61328125, 0.8721923828125, 1.131103515625, 1.3900146484375, 1.64892578125, 1.9078369140625, 2.166748046875, 2.4256591796875, 2.6845703125, 2.9434814453125, 3.202392578125, 3.4613037109375, 3.72021484375, 3.9791259765625, 4.238037109375, 4.4969482421875, 4.755859375, 5.0147705078125, 5.273681640625, 5.5325927734375, 5.79150390625, 6.0504150390625, 6.309326171875, 6.5682373046875, 6.8271484375, 7.0860595703125, 7.344970703125, 7.6038818359375, 7.86279296875, 8.1217041015625, 8.380615234375, 8.6395263671875, 8.8984375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 13.0, 12.0, 13.0, 15.0, 24.0, 29.0, 29.0, 47.0, 49.0, 49.0, 63.0, 59.0, 80.0, 66.0, 69.0, 60.0, 59.0, 48.0, 39.0, 41.0, 30.0, 26.0, 26.0, 18.0, 12.0, 10.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44140625, -3.30987548828125, -3.1783447265625, -3.04681396484375, -2.915283203125, -2.78375244140625, -2.6522216796875, -2.52069091796875, -2.38916015625, -2.25762939453125, -2.1260986328125, -1.99456787109375, -1.863037109375, -1.73150634765625, -1.5999755859375, -1.46844482421875, -1.3369140625, -1.20538330078125, -1.0738525390625, -0.94232177734375, -0.810791015625, -0.67926025390625, -0.5477294921875, -0.41619873046875, -0.28466796875, -0.15313720703125, -0.0216064453125, 0.10992431640625, 0.241455078125, 0.37298583984375, 0.5045166015625, 0.63604736328125, 0.767578125, 0.89910888671875, 1.0306396484375, 1.16217041015625, 1.293701171875, 1.42523193359375, 1.5567626953125, 1.68829345703125, 1.81982421875, 1.95135498046875, 2.0828857421875, 2.21441650390625, 2.345947265625, 2.47747802734375, 2.6090087890625, 2.74053955078125, 2.8720703125, 3.00360107421875, 3.1351318359375, 3.26666259765625, 3.398193359375, 3.52972412109375, 3.6612548828125, 3.79278564453125, 3.92431640625, 4.05584716796875, 4.1873779296875, 4.31890869140625, 4.450439453125, 4.58197021484375, 4.7135009765625, 4.84503173828125, 4.9765625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 17.0, 47.0, 46.0, 96.0, 243.0, 841.0, 5869.0, 415903.0, 3753847.0, 15232.0, 1417.0, 362.0, 129.0, 71.0, 35.0, 24.0, 19.0, 12.0, 12.0, 7.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.685302734375, -9.15185546875, -8.618408203125, -8.0849609375, -7.551513671875, -7.01806640625, -6.484619140625, -5.951171875, -5.417724609375, -4.88427734375, -4.350830078125, -3.8173828125, -3.283935546875, -2.75048828125, -2.217041015625, -1.68359375, -1.150146484375, -0.61669921875, -0.083251953125, 0.4501953125, 0.983642578125, 1.51708984375, 2.050537109375, 2.583984375, 3.117431640625, 3.65087890625, 4.184326171875, 4.7177734375, 5.251220703125, 5.78466796875, 6.318115234375, 6.8515625, 7.385009765625, 7.91845703125, 8.451904296875, 8.9853515625, 9.518798828125, 10.05224609375, 10.585693359375, 11.119140625, 11.652587890625, 12.18603515625, 12.719482421875, 13.2529296875, 13.786376953125, 14.31982421875, 14.853271484375, 15.38671875, 15.920166015625, 16.45361328125, 16.987060546875, 17.5205078125, 18.053955078125, 18.58740234375, 19.120849609375, 19.654296875, 20.187744140625, 20.72119140625, 21.254638671875, 21.7880859375, 22.321533203125, 22.85498046875, 23.388427734375, 23.921875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 2.0, 9.0, 11.0, 11.0, 12.0, 15.0, 30.0, 50.0, 52.0, 85.0, 123.0, 165.0, 310.0, 474.0, 595.0, 687.0, 514.0, 313.0, 190.0, 120.0, 93.0, 54.0, 24.0, 32.0, 25.0, 16.0, 10.0, 14.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0], "bins": [-1.9453125, -1.8941650390625, -1.843017578125, -1.7918701171875, -1.74072265625, -1.6895751953125, -1.638427734375, -1.5872802734375, -1.5361328125, -1.4849853515625, -1.433837890625, -1.3826904296875, -1.33154296875, -1.2803955078125, -1.229248046875, -1.1781005859375, -1.126953125, -1.0758056640625, -1.024658203125, -0.9735107421875, -0.92236328125, -0.8712158203125, -0.820068359375, -0.7689208984375, -0.7177734375, -0.6666259765625, -0.615478515625, -0.5643310546875, -0.51318359375, -0.4620361328125, -0.410888671875, -0.3597412109375, -0.30859375, -0.2574462890625, -0.206298828125, -0.1551513671875, -0.10400390625, -0.0528564453125, -0.001708984375, 0.0494384765625, 0.1005859375, 0.1517333984375, 0.202880859375, 0.2540283203125, 0.30517578125, 0.3563232421875, 0.407470703125, 0.4586181640625, 0.509765625, 0.5609130859375, 0.612060546875, 0.6632080078125, 0.71435546875, 0.7655029296875, 0.816650390625, 0.8677978515625, 0.9189453125, 0.9700927734375, 1.021240234375, 1.0723876953125, 1.12353515625, 1.1746826171875, 1.225830078125, 1.2769775390625, 1.328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 2.0, 10.0, 16.0, 22.0, 25.0, 41.0, 71.0, 100.0, 131.0, 143.0, 115.0, 137.0, 80.0, 37.0, 30.0, 25.0, 15.0, 11.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.551288604736328, -3.272958993911743, -2.994629383087158, -2.716299533843994, -2.437969923019409, -2.159640312194824, -1.8813105821609497, -1.6029808521270752, -1.3246512413024902, -1.0463216304779053, -0.7679919004440308, -0.489662230014801, -0.2113325595855713, 0.06699705123901367, 0.3453267812728882, 0.6236565113067627, 0.9019861221313477, 1.1803157329559326, 1.4586454629898071, 1.7369751930236816, 2.0153048038482666, 2.2936344146728516, 2.5719642639160156, 2.8502938747406006, 3.1286234855651855, 3.4069530963897705, 3.6852827072143555, 3.9636125564575195, 4.241942405700684, 4.5202717781066895, 4.7986016273498535, 5.076930999755859, 5.355259895324707, 5.633589744567871, 5.911919116973877, 6.190248966217041, 6.468578338623047, 6.746908187866211, 7.025238037109375, 7.303567886352539, 7.581897258758545, 7.860227108001709, 8.138556480407715, 8.416886329650879, 8.695216178894043, 8.97354507446289, 9.251874923706055, 9.530204772949219, 9.808534622192383, 10.086864471435547, 10.365194320678711, 10.643523216247559, 10.921853065490723, 11.200182914733887, 11.47851276397705, 11.756842613220215, 12.035171508789062, 12.313501358032227, 12.59183120727539, 12.870160102844238, 13.148489952087402, 13.426819801330566, 13.70514965057373, 13.983479499816895, 14.261809349060059]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 10.0, 12.0, 14.0, 13.0, 18.0, 18.0, 22.0, 27.0, 24.0, 32.0, 42.0, 33.0, 39.0, 31.0, 49.0, 40.0, 39.0, 47.0, 46.0, 48.0, 49.0, 34.0, 35.0, 26.0, 33.0, 24.0, 24.0, 31.0, 28.0, 19.0, 27.0, 12.0, 11.0, 8.0, 4.0, 4.0, 7.0, 4.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3730459213256836, -3.2639875411987305, -3.1549289226531982, -3.045870542526245, -2.936811923980713, -2.8277535438537598, -2.7186951637268066, -2.6096365451812744, -2.500577926635742, -2.391519546508789, -2.282460927963257, -2.1734025478363037, -2.0643439292907715, -1.9552855491638184, -1.8462270498275757, -1.737168550491333, -1.6281101703643799, -1.5190516710281372, -1.4099931716918945, -1.3009347915649414, -1.1918761730194092, -1.082817792892456, -0.9737592935562134, -0.8647007942199707, -0.755642294883728, -0.6465837955474854, -0.5375252962112427, -0.4284668564796448, -0.3194083571434021, -0.21034985780715942, -0.10129141807556152, 0.007767081260681152, 0.11682581901550293, 0.2258843034505844, 0.3349427878856659, 0.4440012574195862, 0.5530597567558289, 0.6621182560920715, 0.7711766958236694, 0.8802351951599121, 0.9892936944961548, 1.0983521938323975, 1.2074106931686401, 1.3164691925048828, 1.425527572631836, 1.5345861911773682, 1.6436445713043213, 1.752703070640564, 1.8617615699768066, 1.9708200693130493, 2.079878568649292, 2.188936948776245, 2.2979955673217773, 2.4070539474487305, 2.5161123275756836, 2.625170946121216, 2.734229564666748, 2.843287944793701, 2.9523465633392334, 3.0614049434661865, 3.1704635620117188, 3.279521942138672, 3.388580322265625, 3.4976389408111572, 3.6066973209381104]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 9.0, 19.0, 22.0, 38.0, 63.0, 97.0, 135.0, 274.0, 477.0, 875.0, 1606.0, 3406.0, 7035.0, 15521.0, 38356.0, 109111.0, 332785.0, 348906.0, 117532.0, 40749.0, 16876.0, 7297.0, 3575.0, 1685.0, 908.0, 503.0, 276.0, 151.0, 85.0, 55.0, 46.0, 20.0, 14.0, 15.0, 10.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3101348876953125, -1.271636962890625, -1.2331390380859375, -1.19464111328125, -1.1561431884765625, -1.117645263671875, -1.0791473388671875, -1.0406494140625, -1.0021514892578125, -0.963653564453125, -0.9251556396484375, -0.88665771484375, -0.8481597900390625, -0.809661865234375, -0.7711639404296875, -0.732666015625, -0.6941680908203125, -0.655670166015625, -0.6171722412109375, -0.57867431640625, -0.5401763916015625, -0.501678466796875, -0.4631805419921875, -0.4246826171875, -0.3861846923828125, -0.347686767578125, -0.3091888427734375, -0.27069091796875, -0.2321929931640625, -0.193695068359375, -0.1551971435546875, -0.11669921875, -0.0782012939453125, -0.039703369140625, -0.0012054443359375, 0.03729248046875, 0.0757904052734375, 0.114288330078125, 0.1527862548828125, 0.1912841796875, 0.2297821044921875, 0.268280029296875, 0.3067779541015625, 0.34527587890625, 0.3837738037109375, 0.422271728515625, 0.4607696533203125, 0.499267578125, 0.5377655029296875, 0.576263427734375, 0.6147613525390625, 0.65325927734375, 0.6917572021484375, 0.730255126953125, 0.7687530517578125, 0.8072509765625, 0.8457489013671875, 0.884246826171875, 0.9227447509765625, 0.96124267578125, 0.9997406005859375, 1.038238525390625, 1.0767364501953125, 1.115234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 4.0, 7.0, 12.0, 7.0, 12.0, 18.0, 20.0, 25.0, 23.0, 22.0, 36.0, 43.0, 28.0, 47.0, 53.0, 47.0, 40.0, 57.0, 39.0, 43.0, 61.0, 47.0, 43.0, 31.0, 38.0, 24.0, 25.0, 31.0, 21.0, 21.0, 15.0, 17.0, 8.0, 8.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -2.00445556640625, -1.9346923828125, -1.86492919921875, -1.795166015625, -1.72540283203125, -1.6556396484375, -1.58587646484375, -1.51611328125, -1.44635009765625, -1.3765869140625, -1.30682373046875, -1.237060546875, -1.16729736328125, -1.0975341796875, -1.02777099609375, -0.9580078125, -0.88824462890625, -0.8184814453125, -0.74871826171875, -0.678955078125, -0.60919189453125, -0.5394287109375, -0.46966552734375, -0.39990234375, -0.33013916015625, -0.2603759765625, -0.19061279296875, -0.120849609375, -0.05108642578125, 0.0186767578125, 0.08843994140625, 0.158203125, 0.22796630859375, 0.2977294921875, 0.36749267578125, 0.437255859375, 0.50701904296875, 0.5767822265625, 0.64654541015625, 0.71630859375, 0.78607177734375, 0.8558349609375, 0.92559814453125, 0.995361328125, 1.06512451171875, 1.1348876953125, 1.20465087890625, 1.2744140625, 1.34417724609375, 1.4139404296875, 1.48370361328125, 1.553466796875, 1.62322998046875, 1.6929931640625, 1.76275634765625, 1.83251953125, 1.90228271484375, 1.9720458984375, 2.04180908203125, 2.111572265625, 2.18133544921875, 2.2510986328125, 2.32086181640625, 2.390625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 11.0, 4.0, 2.0, 4.0, 8.0, 7.0, 15.0, 16.0, 19.0, 24.0, 40.0, 49.0, 76.0, 90.0, 176.0, 279.0, 509.0, 1095.0, 2495.0, 6740.0, 21466.0, 87487.0, 448872.0, 378949.0, 71471.0, 18235.0, 5877.0, 2272.0, 1054.0, 476.0, 245.0, 181.0, 88.0, 75.0, 36.0, 30.0, 19.0, 19.0, 15.0, 6.0, 10.0, 10.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.4989776611328125, -1.447174072265625, -1.3953704833984375, -1.34356689453125, -1.2917633056640625, -1.239959716796875, -1.1881561279296875, -1.1363525390625, -1.0845489501953125, -1.032745361328125, -0.9809417724609375, -0.92913818359375, -0.8773345947265625, -0.825531005859375, -0.7737274169921875, -0.721923828125, -0.6701202392578125, -0.618316650390625, -0.5665130615234375, -0.51470947265625, -0.4629058837890625, -0.411102294921875, -0.3592987060546875, -0.3074951171875, -0.2556915283203125, -0.203887939453125, -0.1520843505859375, -0.10028076171875, -0.0484771728515625, 0.003326416015625, 0.0551300048828125, 0.10693359375, 0.1587371826171875, 0.210540771484375, 0.2623443603515625, 0.31414794921875, 0.3659515380859375, 0.417755126953125, 0.4695587158203125, 0.5213623046875, 0.5731658935546875, 0.624969482421875, 0.6767730712890625, 0.72857666015625, 0.7803802490234375, 0.832183837890625, 0.8839874267578125, 0.935791015625, 0.9875946044921875, 1.039398193359375, 1.0912017822265625, 1.14300537109375, 1.1948089599609375, 1.246612548828125, 1.2984161376953125, 1.3502197265625, 1.4020233154296875, 1.453826904296875, 1.5056304931640625, 1.55743408203125, 1.6092376708984375, 1.661041259765625, 1.7128448486328125, 1.7646484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 17.0, 13.0, 14.0, 14.0, 23.0, 24.0, 33.0, 37.0, 31.0, 46.0, 43.0, 53.0, 58.0, 43.0, 65.0, 72.0, 42.0, 50.0, 52.0, 32.0, 45.0, 33.0, 27.0, 25.0, 20.0, 14.0, 13.0, 13.0, 10.0, 5.0, 10.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.7623291015625, -5.591064453125, -5.4197998046875, -5.24853515625, -5.0772705078125, -4.906005859375, -4.7347412109375, -4.5634765625, -4.3922119140625, -4.220947265625, -4.0496826171875, -3.87841796875, -3.7071533203125, -3.535888671875, -3.3646240234375, -3.193359375, -3.0220947265625, -2.850830078125, -2.6795654296875, -2.50830078125, -2.3370361328125, -2.165771484375, -1.9945068359375, -1.8232421875, -1.6519775390625, -1.480712890625, -1.3094482421875, -1.13818359375, -0.9669189453125, -0.795654296875, -0.6243896484375, -0.453125, -0.2818603515625, -0.110595703125, 0.0606689453125, 0.23193359375, 0.4031982421875, 0.574462890625, 0.7457275390625, 0.9169921875, 1.0882568359375, 1.259521484375, 1.4307861328125, 1.60205078125, 1.7733154296875, 1.944580078125, 2.1158447265625, 2.287109375, 2.4583740234375, 2.629638671875, 2.8009033203125, 2.97216796875, 3.1434326171875, 3.314697265625, 3.4859619140625, 3.6572265625, 3.8284912109375, 3.999755859375, 4.1710205078125, 4.34228515625, 4.5135498046875, 4.684814453125, 4.8560791015625, 5.02734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 12.0, 7.0, 15.0, 26.0, 23.0, 56.0, 74.0, 94.0, 143.0, 223.0, 323.0, 498.0, 753.0, 1095.0, 1961.0, 3421.0, 6376.0, 16320.0, 70189.0, 558619.0, 322596.0, 41539.0, 11889.0, 5025.0, 2814.0, 1561.0, 934.0, 636.0, 408.0, 319.0, 192.0, 111.0, 86.0, 54.0, 39.0, 25.0, 24.0, 19.0, 15.0, 4.0, 6.0, 7.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.001953125, -0.9714508056640625, -0.940948486328125, -0.9104461669921875, -0.87994384765625, -0.8494415283203125, -0.818939208984375, -0.7884368896484375, -0.7579345703125, -0.7274322509765625, -0.696929931640625, -0.6664276123046875, -0.63592529296875, -0.6054229736328125, -0.574920654296875, -0.5444183349609375, -0.513916015625, -0.4834136962890625, -0.452911376953125, -0.4224090576171875, -0.39190673828125, -0.3614044189453125, -0.330902099609375, -0.3003997802734375, -0.2698974609375, -0.2393951416015625, -0.208892822265625, -0.1783905029296875, -0.14788818359375, -0.1173858642578125, -0.086883544921875, -0.0563812255859375, -0.02587890625, 0.0046234130859375, 0.035125732421875, 0.0656280517578125, 0.09613037109375, 0.1266326904296875, 0.157135009765625, 0.1876373291015625, 0.2181396484375, 0.2486419677734375, 0.279144287109375, 0.3096466064453125, 0.34014892578125, 0.3706512451171875, 0.401153564453125, 0.4316558837890625, 0.462158203125, 0.4926605224609375, 0.523162841796875, 0.5536651611328125, 0.58416748046875, 0.6146697998046875, 0.645172119140625, 0.6756744384765625, 0.7061767578125, 0.7366790771484375, 0.767181396484375, 0.7976837158203125, 0.82818603515625, 0.8586883544921875, 0.889190673828125, 0.9196929931640625, 0.9501953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 10.0, 19.0, 17.0, 28.0, 37.0, 51.0, 90.0, 97.0, 132.0, 138.0, 100.0, 71.0, 43.0, 41.0, 28.0, 22.0, 10.0, 7.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0004513263702392578, -0.00043908506631851196, -0.0004268437623977661, -0.00041460245847702026, -0.0004023611545562744, -0.00039011985063552856, -0.0003778785467147827, -0.00036563724279403687, -0.000353395938873291, -0.00034115463495254517, -0.0003289133310317993, -0.00031667202711105347, -0.0003044307231903076, -0.00029218941926956177, -0.0002799481153488159, -0.00026770681142807007, -0.0002554655075073242, -0.00024322420358657837, -0.00023098289966583252, -0.00021874159574508667, -0.00020650029182434082, -0.00019425898790359497, -0.00018201768398284912, -0.00016977638006210327, -0.00015753507614135742, -0.00014529377222061157, -0.00013305246829986572, -0.00012081116437911987, -0.00010856986045837402, -9.632855653762817e-05, -8.408725261688232e-05, -7.184594869613647e-05, -5.9604644775390625e-05, -4.7363340854644775e-05, -3.5122036933898926e-05, -2.2880733013153076e-05, -1.0639429092407227e-05, 1.601874828338623e-06, 1.3843178749084473e-05, 2.6084482669830322e-05, 3.832578659057617e-05, 5.056709051132202e-05, 6.280839443206787e-05, 7.504969835281372e-05, 8.729100227355957e-05, 9.953230619430542e-05, 0.00011177361011505127, 0.00012401491403579712, 0.00013625621795654297, 0.00014849752187728882, 0.00016073882579803467, 0.00017298012971878052, 0.00018522143363952637, 0.00019746273756027222, 0.00020970404148101807, 0.00022194534540176392, 0.00023418664932250977, 0.0002464279532432556, 0.00025866925716400146, 0.0002709105610847473, 0.00028315186500549316, 0.000295393168926239, 0.00030763447284698486, 0.0003198757767677307, 0.00033211708068847656]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 8.0, 4.0, 10.0, 6.0, 17.0, 11.0, 25.0, 31.0, 62.0, 98.0, 150.0, 282.0, 398.0, 734.0, 1319.0, 2577.0, 5301.0, 12820.0, 47785.0, 373298.0, 508497.0, 66923.0, 15616.0, 5966.0, 2972.0, 1515.0, 870.0, 506.0, 269.0, 160.0, 100.0, 76.0, 33.0, 30.0, 19.0, 18.0, 10.0, 5.0, 9.0, 9.0, 4.0, 3.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.125, -1.09100341796875, -1.0570068359375, -1.02301025390625, -0.989013671875, -0.95501708984375, -0.9210205078125, -0.88702392578125, -0.85302734375, -0.81903076171875, -0.7850341796875, -0.75103759765625, -0.717041015625, -0.68304443359375, -0.6490478515625, -0.61505126953125, -0.5810546875, -0.54705810546875, -0.5130615234375, -0.47906494140625, -0.445068359375, -0.41107177734375, -0.3770751953125, -0.34307861328125, -0.30908203125, -0.27508544921875, -0.2410888671875, -0.20709228515625, -0.173095703125, -0.13909912109375, -0.1051025390625, -0.07110595703125, -0.037109375, -0.00311279296875, 0.0308837890625, 0.06488037109375, 0.098876953125, 0.13287353515625, 0.1668701171875, 0.20086669921875, 0.23486328125, 0.26885986328125, 0.3028564453125, 0.33685302734375, 0.370849609375, 0.40484619140625, 0.4388427734375, 0.47283935546875, 0.5068359375, 0.54083251953125, 0.5748291015625, 0.60882568359375, 0.642822265625, 0.67681884765625, 0.7108154296875, 0.74481201171875, 0.77880859375, 0.81280517578125, 0.8468017578125, 0.88079833984375, 0.914794921875, 0.94879150390625, 0.9827880859375, 1.01678466796875, 1.05078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 7.0, 6.0, 12.0, 7.0, 18.0, 16.0, 47.0, 74.0, 83.0, 101.0, 124.0, 108.0, 109.0, 77.0, 56.0, 42.0, 18.0, 15.0, 8.0, 6.0, 11.0, 6.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.21961212158203125, -0.2104644775390625, -0.20131683349609375, -0.192169189453125, -0.18302154541015625, -0.1738739013671875, -0.16472625732421875, -0.15557861328125, -0.14643096923828125, -0.1372833251953125, -0.12813568115234375, -0.118988037109375, -0.10984039306640625, -0.1006927490234375, -0.09154510498046875, -0.0823974609375, -0.07324981689453125, -0.0641021728515625, -0.05495452880859375, -0.045806884765625, -0.03665924072265625, -0.0275115966796875, -0.01836395263671875, -0.00921630859375, -6.866455078125e-05, 0.0090789794921875, 0.01822662353515625, 0.027374267578125, 0.03652191162109375, 0.0456695556640625, 0.05481719970703125, 0.06396484375, 0.07311248779296875, 0.0822601318359375, 0.09140777587890625, 0.100555419921875, 0.10970306396484375, 0.1188507080078125, 0.12799835205078125, 0.13714599609375, 0.14629364013671875, 0.1554412841796875, 0.16458892822265625, 0.173736572265625, 0.18288421630859375, 0.1920318603515625, 0.20117950439453125, 0.2103271484375, 0.21947479248046875, 0.2286224365234375, 0.23777008056640625, 0.246917724609375, 0.25606536865234375, 0.2652130126953125, 0.27436065673828125, 0.28350830078125, 0.29265594482421875, 0.3018035888671875, 0.31095123291015625, 0.320098876953125, 0.32924652099609375, 0.3383941650390625, 0.34754180908203125, 0.356689453125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 15.0, 21.0, 21.0, 44.0, 45.0, 60.0, 90.0, 107.0, 125.0, 114.0, 104.0, 86.0, 48.0, 49.0, 23.0, 19.0, 9.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1956605911254883, -2.0638885498046875, -1.9321165084838867, -1.800344467163086, -1.6685724258422852, -1.5368003845214844, -1.4050283432006836, -1.2732563018798828, -1.141484260559082, -1.0097122192382812, -0.8779401779174805, -0.7461681365966797, -0.6143960952758789, -0.4826240539550781, -0.35085201263427734, -0.21907997131347656, -0.08730792999267578, 0.044464111328125, 0.17623615264892578, 0.30800819396972656, 0.43978023529052734, 0.5715522766113281, 0.7033243179321289, 0.8350963592529297, 0.9668684005737305, 1.0986404418945312, 1.230412483215332, 1.3621845245361328, 1.4939565658569336, 1.6257286071777344, 1.7575006484985352, 1.889272689819336, 2.0210442543029785, 2.1528162956237793, 2.28458833694458, 2.416360378265381, 2.5481324195861816, 2.6799044609069824, 2.811676502227783, 2.943448543548584, 3.0752205848693848, 3.2069926261901855, 3.3387646675109863, 3.470536708831787, 3.602308750152588, 3.7340807914733887, 3.8658528327941895, 3.9976248741149902, 4.129396915435791, 4.261168956756592, 4.392940998077393, 4.524713039398193, 4.656485080718994, 4.788257122039795, 4.920029163360596, 5.0518012046813965, 5.183573246002197, 5.315345287322998, 5.447117328643799, 5.5788893699646, 5.7106614112854, 5.842433452606201, 5.974205493927002, 6.105977535247803, 6.2377495765686035]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 7.0, 10.0, 12.0, 18.0, 18.0, 17.0, 21.0, 23.0, 30.0, 35.0, 27.0, 39.0, 56.0, 55.0, 34.0, 39.0, 39.0, 50.0, 50.0, 54.0, 45.0, 45.0, 26.0, 42.0, 35.0, 31.0, 23.0, 21.0, 24.0, 17.0, 12.0, 6.0, 9.0, 6.0, 3.0, 1.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05198073387146, -1.9827872514724731, -1.9135937690734863, -1.8444002866744995, -1.7752068042755127, -1.7060132026672363, -1.6368197202682495, -1.5676262378692627, -1.4984327554702759, -1.429239273071289, -1.3600457906723022, -1.2908523082733154, -1.221658706665039, -1.1524653434753418, -1.0832717418670654, -1.0140782594680786, -0.9448847770690918, -0.875691294670105, -0.8064978122711182, -0.7373042702674866, -0.6681107878684998, -0.5989173054695129, -0.5297237634658813, -0.46053028106689453, -0.3913367986679077, -0.3221433162689209, -0.2529498040676117, -0.18375630676746368, -0.11456280946731567, -0.04536932706832886, 0.023824185132980347, 0.09301769733428955, 0.16221117973327637, 0.23140467703342438, 0.3005981743335724, 0.3697916865348816, 0.4389851689338684, 0.5081786513328552, 0.5773721933364868, 0.6465656757354736, 0.7157591581344604, 0.7849526405334473, 0.8541461229324341, 0.9233396649360657, 0.9925331473350525, 1.0617265701293945, 1.130920171737671, 1.2001136541366577, 1.2693071365356445, 1.3385006189346313, 1.4076941013336182, 1.476887583732605, 1.5460810661315918, 1.6152746677398682, 1.684468150138855, 1.7536616325378418, 1.8228551149368286, 1.8920485973358154, 1.9612420797348022, 2.030435562133789, 2.0996291637420654, 2.1688225269317627, 2.238016128540039, 2.3072094917297363, 2.3764030933380127]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 16.0, 20.0, 35.0, 53.0, 79.0, 145.0, 274.0, 491.0, 1102.0, 2442.0, 6339.0, 19377.0, 74314.0, 434389.0, 409823.0, 70464.0, 18500.0, 6109.0, 2359.0, 1044.0, 543.0, 263.0, 133.0, 92.0, 45.0, 29.0, 30.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.549346923828125, -4.42291259765625, -4.296478271484375, -4.1700439453125, -4.043609619140625, -3.91717529296875, -3.790740966796875, -3.664306640625, -3.537872314453125, -3.41143798828125, -3.285003662109375, -3.1585693359375, -3.032135009765625, -2.90570068359375, -2.779266357421875, -2.65283203125, -2.526397705078125, -2.39996337890625, -2.273529052734375, -2.1470947265625, -2.020660400390625, -1.89422607421875, -1.767791748046875, -1.641357421875, -1.514923095703125, -1.38848876953125, -1.262054443359375, -1.1356201171875, -1.009185791015625, -0.88275146484375, -0.756317138671875, -0.6298828125, -0.503448486328125, -0.37701416015625, -0.250579833984375, -0.1241455078125, 0.002288818359375, 0.12872314453125, 0.255157470703125, 0.381591796875, 0.508026123046875, 0.63446044921875, 0.760894775390625, 0.8873291015625, 1.013763427734375, 1.14019775390625, 1.266632080078125, 1.39306640625, 1.519500732421875, 1.64593505859375, 1.772369384765625, 1.8988037109375, 2.025238037109375, 2.15167236328125, 2.278106689453125, 2.404541015625, 2.530975341796875, 2.65740966796875, 2.783843994140625, 2.9102783203125, 3.036712646484375, 3.16314697265625, 3.289581298828125, 3.416015625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 15.0, 18.0, 23.0, 23.0, 26.0, 33.0, 51.0, 45.0, 33.0, 55.0, 57.0, 55.0, 66.0, 52.0, 48.0, 66.0, 55.0, 56.0, 47.0, 36.0, 28.0, 25.0, 18.0, 14.0, 5.0, 14.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.69134521484375, -4.4998779296875, -4.30841064453125, -4.116943359375, -3.92547607421875, -3.7340087890625, -3.54254150390625, -3.35107421875, -3.15960693359375, -2.9681396484375, -2.77667236328125, -2.585205078125, -2.39373779296875, -2.2022705078125, -2.01080322265625, -1.8193359375, -1.62786865234375, -1.4364013671875, -1.24493408203125, -1.053466796875, -0.86199951171875, -0.6705322265625, -0.47906494140625, -0.28759765625, -0.09613037109375, 0.0953369140625, 0.28680419921875, 0.478271484375, 0.66973876953125, 0.8612060546875, 1.05267333984375, 1.244140625, 1.43560791015625, 1.6270751953125, 1.81854248046875, 2.010009765625, 2.20147705078125, 2.3929443359375, 2.58441162109375, 2.77587890625, 2.96734619140625, 3.1588134765625, 3.35028076171875, 3.541748046875, 3.73321533203125, 3.9246826171875, 4.11614990234375, 4.3076171875, 4.49908447265625, 4.6905517578125, 4.88201904296875, 5.073486328125, 5.26495361328125, 5.4564208984375, 5.64788818359375, 5.83935546875, 6.03082275390625, 6.2222900390625, 6.41375732421875, 6.605224609375, 6.79669189453125, 6.9881591796875, 7.17962646484375, 7.37109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 9.0, 6.0, 13.0, 23.0, 32.0, 67.0, 83.0, 180.0, 462.0, 1594.0, 9489.0, 140000.0, 841695.0, 48383.0, 4894.0, 978.0, 303.0, 143.0, 81.0, 36.0, 24.0, 18.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.53125, -6.2734375, -6.015625, -5.7578125, -5.5, -5.2421875, -4.984375, -4.7265625, -4.46875, -4.2109375, -3.953125, -3.6953125, -3.4375, -3.1796875, -2.921875, -2.6640625, -2.40625, -2.1484375, -1.890625, -1.6328125, -1.375, -1.1171875, -0.859375, -0.6015625, -0.34375, -0.0859375, 0.171875, 0.4296875, 0.6875, 0.9453125, 1.203125, 1.4609375, 1.71875, 1.9765625, 2.234375, 2.4921875, 2.75, 3.0078125, 3.265625, 3.5234375, 3.78125, 4.0390625, 4.296875, 4.5546875, 4.8125, 5.0703125, 5.328125, 5.5859375, 5.84375, 6.1015625, 6.359375, 6.6171875, 6.875, 7.1328125, 7.390625, 7.6484375, 7.90625, 8.1640625, 8.421875, 8.6796875, 8.9375, 9.1953125, 9.453125, 9.7109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 14.0, 9.0, 20.0, 23.0, 21.0, 23.0, 38.0, 33.0, 31.0, 45.0, 39.0, 54.0, 57.0, 66.0, 67.0, 57.0, 55.0, 52.0, 55.0, 38.0, 46.0, 18.0, 17.0, 19.0, 23.0, 18.0, 10.0, 10.0, 12.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.036865234375, -5.81982421875, -5.602783203125, -5.3857421875, -5.168701171875, -4.95166015625, -4.734619140625, -4.517578125, -4.300537109375, -4.08349609375, -3.866455078125, -3.6494140625, -3.432373046875, -3.21533203125, -2.998291015625, -2.78125, -2.564208984375, -2.34716796875, -2.130126953125, -1.9130859375, -1.696044921875, -1.47900390625, -1.261962890625, -1.044921875, -0.827880859375, -0.61083984375, -0.393798828125, -0.1767578125, 0.040283203125, 0.25732421875, 0.474365234375, 0.69140625, 0.908447265625, 1.12548828125, 1.342529296875, 1.5595703125, 1.776611328125, 1.99365234375, 2.210693359375, 2.427734375, 2.644775390625, 2.86181640625, 3.078857421875, 3.2958984375, 3.512939453125, 3.72998046875, 3.947021484375, 4.1640625, 4.381103515625, 4.59814453125, 4.815185546875, 5.0322265625, 5.249267578125, 5.46630859375, 5.683349609375, 5.900390625, 6.117431640625, 6.33447265625, 6.551513671875, 6.7685546875, 6.985595703125, 7.20263671875, 7.419677734375, 7.63671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 8.0, 15.0, 12.0, 30.0, 44.0, 50.0, 138.0, 399.0, 1955.0, 13733.0, 198038.0, 780760.0, 47027.0, 5042.0, 889.0, 206.0, 79.0, 41.0, 19.0, 15.0, 13.0, 7.0, 6.0, 6.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.146484375, -2.085601806640625, -2.02471923828125, -1.963836669921875, -1.9029541015625, -1.842071533203125, -1.78118896484375, -1.720306396484375, -1.659423828125, -1.598541259765625, -1.53765869140625, -1.476776123046875, -1.4158935546875, -1.355010986328125, -1.29412841796875, -1.233245849609375, -1.17236328125, -1.111480712890625, -1.05059814453125, -0.989715576171875, -0.9288330078125, -0.867950439453125, -0.80706787109375, -0.746185302734375, -0.685302734375, -0.624420166015625, -0.56353759765625, -0.502655029296875, -0.4417724609375, -0.380889892578125, -0.32000732421875, -0.259124755859375, -0.1982421875, -0.137359619140625, -0.07647705078125, -0.015594482421875, 0.0452880859375, 0.106170654296875, 0.16705322265625, 0.227935791015625, 0.288818359375, 0.349700927734375, 0.41058349609375, 0.471466064453125, 0.5323486328125, 0.593231201171875, 0.65411376953125, 0.714996337890625, 0.77587890625, 0.836761474609375, 0.89764404296875, 0.958526611328125, 1.0194091796875, 1.080291748046875, 1.14117431640625, 1.202056884765625, 1.262939453125, 1.323822021484375, 1.38470458984375, 1.445587158203125, 1.5064697265625, 1.567352294921875, 1.62823486328125, 1.689117431640625, 1.75]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 12.0, 6.0, 11.0, 26.0, 32.0, 40.0, 74.0, 84.0, 136.0, 191.0, 121.0, 83.0, 44.0, 37.0, 32.0, 11.0, 17.0, 10.0, 7.0, 5.0, 2.0, 3.0, 4.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0002899169921875, -0.00028253719210624695, -0.0002751573920249939, -0.00026777759194374084, -0.0002603977918624878, -0.00025301799178123474, -0.0002456381916999817, -0.00023825839161872864, -0.00023087859153747559, -0.00022349879145622253, -0.00021611899137496948, -0.00020873919129371643, -0.00020135939121246338, -0.00019397959113121033, -0.00018659979104995728, -0.00017921999096870422, -0.00017184019088745117, -0.00016446039080619812, -0.00015708059072494507, -0.00014970079064369202, -0.00014232099056243896, -0.0001349411904811859, -0.00012756139039993286, -0.00012018159031867981, -0.00011280179023742676, -0.0001054219901561737, -9.804219007492065e-05, -9.06623899936676e-05, -8.328258991241455e-05, -7.59027898311615e-05, -6.852298974990845e-05, -6.11431896686554e-05, -5.3763389587402344e-05, -4.638358950614929e-05, -3.900378942489624e-05, -3.162398934364319e-05, -2.4244189262390137e-05, -1.6864389181137085e-05, -9.484589099884033e-06, -2.1047890186309814e-06, 5.27501106262207e-06, 1.2654811143875122e-05, 2.0034611225128174e-05, 2.7414411306381226e-05, 3.479421138763428e-05, 4.217401146888733e-05, 4.955381155014038e-05, 5.693361163139343e-05, 6.431341171264648e-05, 7.169321179389954e-05, 7.907301187515259e-05, 8.645281195640564e-05, 9.383261203765869e-05, 0.00010121241211891174, 0.0001085922122001648, 0.00011597201228141785, 0.0001233518123626709, 0.00013073161244392395, 0.000138111412525177, 0.00014549121260643005, 0.0001528710126876831, 0.00016025081276893616, 0.0001676306128501892, 0.00017501041293144226, 0.0001823902130126953]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 10.0, 14.0, 28.0, 31.0, 51.0, 111.0, 181.0, 335.0, 738.0, 1802.0, 5877.0, 25980.0, 168766.0, 663766.0, 149340.0, 22999.0, 5312.0, 1729.0, 682.0, 352.0, 182.0, 102.0, 43.0, 44.0, 21.0, 13.0, 11.0, 12.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0479888916015625, -1.005157470703125, -0.9623260498046875, -0.91949462890625, -0.8766632080078125, -0.833831787109375, -0.7910003662109375, -0.7481689453125, -0.7053375244140625, -0.662506103515625, -0.6196746826171875, -0.57684326171875, -0.5340118408203125, -0.491180419921875, -0.4483489990234375, -0.405517578125, -0.3626861572265625, -0.319854736328125, -0.2770233154296875, -0.23419189453125, -0.1913604736328125, -0.148529052734375, -0.1056976318359375, -0.0628662109375, -0.0200347900390625, 0.022796630859375, 0.0656280517578125, 0.10845947265625, 0.1512908935546875, 0.194122314453125, 0.2369537353515625, 0.27978515625, 0.3226165771484375, 0.365447998046875, 0.4082794189453125, 0.45111083984375, 0.4939422607421875, 0.536773681640625, 0.5796051025390625, 0.6224365234375, 0.6652679443359375, 0.708099365234375, 0.7509307861328125, 0.79376220703125, 0.8365936279296875, 0.879425048828125, 0.9222564697265625, 0.965087890625, 1.0079193115234375, 1.050750732421875, 1.0935821533203125, 1.13641357421875, 1.1792449951171875, 1.222076416015625, 1.2649078369140625, 1.3077392578125, 1.3505706787109375, 1.393402099609375, 1.4362335205078125, 1.47906494140625, 1.5218963623046875, 1.564727783203125, 1.6075592041015625, 1.650390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 16.0, 1.0, 12.0, 23.0, 29.0, 40.0, 59.0, 64.0, 97.0, 154.0, 145.0, 98.0, 78.0, 59.0, 50.0, 29.0, 23.0, 14.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.92205810546875, -0.8978271484375, -0.87359619140625, -0.849365234375, -0.82513427734375, -0.8009033203125, -0.77667236328125, -0.75244140625, -0.72821044921875, -0.7039794921875, -0.67974853515625, -0.655517578125, -0.63128662109375, -0.6070556640625, -0.58282470703125, -0.55859375, -0.53436279296875, -0.5101318359375, -0.48590087890625, -0.461669921875, -0.43743896484375, -0.4132080078125, -0.38897705078125, -0.36474609375, -0.34051513671875, -0.3162841796875, -0.29205322265625, -0.267822265625, -0.24359130859375, -0.2193603515625, -0.19512939453125, -0.1708984375, -0.14666748046875, -0.1224365234375, -0.09820556640625, -0.073974609375, -0.04974365234375, -0.0255126953125, -0.00128173828125, 0.02294921875, 0.04718017578125, 0.0714111328125, 0.09564208984375, 0.119873046875, 0.14410400390625, 0.1683349609375, 0.19256591796875, 0.216796875, 0.24102783203125, 0.2652587890625, 0.28948974609375, 0.313720703125, 0.33795166015625, 0.3621826171875, 0.38641357421875, 0.41064453125, 0.43487548828125, 0.4591064453125, 0.48333740234375, 0.507568359375, 0.53179931640625, 0.5560302734375, 0.58026123046875, 0.6044921875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 13.0, 10.0, 22.0, 41.0, 47.0, 83.0, 103.0, 126.0, 130.0, 140.0, 94.0, 83.0, 47.0, 30.0, 22.0, 10.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.41785717010498, -10.076034545898438, -9.734212875366211, -9.392390251159668, -9.050567626953125, -8.708745956420898, -8.366923332214355, -8.025100708007812, -7.683279037475586, -7.341456890106201, -6.999634742736816, -6.657812118530273, -6.315989971160889, -5.974167823791504, -5.632345199584961, -5.290523052215576, -4.948700904846191, -4.606878757476807, -4.265056610107422, -3.923233985900879, -3.581411838531494, -3.2395896911621094, -2.8977673053741455, -2.5559449195861816, -2.214122772216797, -1.8723005056381226, -1.5304782390594482, -1.188655972480774, -0.8468337059020996, -0.5050114393234253, -0.16318917274475098, 0.1786332130432129, 0.5204553604125977, 0.862277626991272, 1.2040998935699463, 1.5459221601486206, 1.887744426727295, 2.2295665740966797, 2.5713889598846436, 2.9132113456726074, 3.255033493041992, 3.596855640411377, 3.938678026199341, 4.280500411987305, 4.6223225593566895, 4.964144706726074, 5.305967330932617, 5.647789478302002, 5.989611625671387, 6.3314337730407715, 6.673255920410156, 7.015078544616699, 7.356900691986084, 7.698722839355469, 8.040545463562012, 8.382368087768555, 8.724189758300781, 9.066012382507324, 9.40783405303955, 9.749656677246094, 10.09147834777832, 10.433300971984863, 10.775123596191406, 11.116945266723633, 11.458767890930176]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 9.0, 8.0, 10.0, 7.0, 11.0, 22.0, 20.0, 25.0, 21.0, 30.0, 28.0, 42.0, 41.0, 41.0, 59.0, 38.0, 54.0, 37.0, 59.0, 47.0, 49.0, 35.0, 41.0, 28.0, 34.0, 36.0, 18.0, 33.0, 16.0, 19.0, 16.0, 12.0, 16.0, 9.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-11.993329048156738, -11.681588172912598, -11.369847297668457, -11.058106422424316, -10.746365547180176, -10.434624671936035, -10.122883796691895, -9.811142921447754, -9.499402046203613, -9.187661170959473, -8.875920295715332, -8.564179420471191, -8.25243854522705, -7.94069766998291, -7.6289567947387695, -7.317215919494629, -7.005475044250488, -6.693734169006348, -6.381993293762207, -6.070252418518066, -5.758511543273926, -5.446770668029785, -5.1350297927856445, -4.823288917541504, -4.511548042297363, -4.199807167053223, -3.888066291809082, -3.5763254165649414, -3.264584541320801, -2.95284366607666, -2.6411027908325195, -2.329361915588379, -2.0176210403442383, -1.7058801651000977, -1.394139289855957, -1.0823984146118164, -0.7706575393676758, -0.45891666412353516, -0.14717578887939453, 0.1645650863647461, 0.4763059616088867, 0.7880468368530273, 1.099787712097168, 1.4115285873413086, 1.7232694625854492, 2.03501033782959, 2.3467512130737305, 2.658492088317871, 2.9702329635620117, 3.2819738388061523, 3.593714714050293, 3.9054555892944336, 4.217196464538574, 4.528937339782715, 4.8406782150268555, 5.152419090270996, 5.464159965515137, 5.775900840759277, 6.087641716003418, 6.399382591247559, 6.711123466491699, 7.02286434173584, 7.3346052169799805, 7.646346092224121, 7.958086967468262]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 8.0, 11.0, 12.0, 15.0, 26.0, 31.0, 33.0, 48.0, 73.0, 126.0, 205.0, 347.0, 673.0, 1603.0, 4264.0, 16446.0, 142702.0, 3569547.0, 419988.0, 27313.0, 6744.0, 2101.0, 805.0, 467.0, 227.0, 126.0, 87.0, 72.0, 46.0, 35.0, 20.0, 19.0, 12.0, 12.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.828125, -8.59356689453125, -8.3590087890625, -8.12445068359375, -7.889892578125, -7.65533447265625, -7.4207763671875, -7.18621826171875, -6.95166015625, -6.71710205078125, -6.4825439453125, -6.24798583984375, -6.013427734375, -5.77886962890625, -5.5443115234375, -5.30975341796875, -5.0751953125, -4.84063720703125, -4.6060791015625, -4.37152099609375, -4.136962890625, -3.90240478515625, -3.6678466796875, -3.43328857421875, -3.19873046875, -2.96417236328125, -2.7296142578125, -2.49505615234375, -2.260498046875, -2.02593994140625, -1.7913818359375, -1.55682373046875, -1.322265625, -1.08770751953125, -0.8531494140625, -0.61859130859375, -0.384033203125, -0.14947509765625, 0.0850830078125, 0.31964111328125, 0.55419921875, 0.78875732421875, 1.0233154296875, 1.25787353515625, 1.492431640625, 1.72698974609375, 1.9615478515625, 2.19610595703125, 2.4306640625, 2.66522216796875, 2.8997802734375, 3.13433837890625, 3.368896484375, 3.60345458984375, 3.8380126953125, 4.07257080078125, 4.30712890625, 4.54168701171875, 4.7762451171875, 5.01080322265625, 5.245361328125, 5.47991943359375, 5.7144775390625, 5.94903564453125, 6.18359375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 11.0, 26.0, 28.0, 44.0, 58.0, 64.0, 77.0, 66.0, 113.0, 92.0, 83.0, 72.0, 69.0, 58.0, 44.0, 29.0, 21.0, 15.0, 6.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.096405029296875, -4.96234130859375, -4.828277587890625, -4.6942138671875, -4.560150146484375, -4.42608642578125, -4.292022705078125, -4.157958984375, -4.023895263671875, -3.88983154296875, -3.755767822265625, -3.6217041015625, -3.487640380859375, -3.35357666015625, -3.219512939453125, -3.08544921875, -2.951385498046875, -2.81732177734375, -2.683258056640625, -2.5491943359375, -2.415130615234375, -2.28106689453125, -2.147003173828125, -2.012939453125, -1.878875732421875, -1.74481201171875, -1.610748291015625, -1.4766845703125, -1.342620849609375, -1.20855712890625, -1.074493408203125, -0.9404296875, -0.806365966796875, -0.67230224609375, -0.538238525390625, -0.4041748046875, -0.270111083984375, -0.13604736328125, -0.001983642578125, 0.132080078125, 0.266143798828125, 0.40020751953125, 0.534271240234375, 0.6683349609375, 0.802398681640625, 0.93646240234375, 1.070526123046875, 1.20458984375, 1.338653564453125, 1.47271728515625, 1.606781005859375, 1.7408447265625, 1.874908447265625, 2.00897216796875, 2.143035888671875, 2.277099609375, 2.411163330078125, 2.54522705078125, 2.679290771484375, 2.8133544921875, 2.947418212890625, 3.08148193359375, 3.215545654296875, 3.349609375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 8.0, 11.0, 21.0, 33.0, 44.0, 68.0, 139.0, 339.0, 1126.0, 6032.0, 133551.0, 3983977.0, 63343.0, 4159.0, 796.0, 325.0, 110.0, 65.0, 37.0, 24.0, 15.0, 12.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.203125, -10.834716796875, -10.46630859375, -10.097900390625, -9.7294921875, -9.361083984375, -8.99267578125, -8.624267578125, -8.255859375, -7.887451171875, -7.51904296875, -7.150634765625, -6.7822265625, -6.413818359375, -6.04541015625, -5.677001953125, -5.30859375, -4.940185546875, -4.57177734375, -4.203369140625, -3.8349609375, -3.466552734375, -3.09814453125, -2.729736328125, -2.361328125, -1.992919921875, -1.62451171875, -1.256103515625, -0.8876953125, -0.519287109375, -0.15087890625, 0.217529296875, 0.5859375, 0.954345703125, 1.32275390625, 1.691162109375, 2.0595703125, 2.427978515625, 2.79638671875, 3.164794921875, 3.533203125, 3.901611328125, 4.27001953125, 4.638427734375, 5.0068359375, 5.375244140625, 5.74365234375, 6.112060546875, 6.48046875, 6.848876953125, 7.21728515625, 7.585693359375, 7.9541015625, 8.322509765625, 8.69091796875, 9.059326171875, 9.427734375, 9.796142578125, 10.16455078125, 10.532958984375, 10.9013671875, 11.269775390625, 11.63818359375, 12.006591796875, 12.375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 8.0, 15.0, 23.0, 38.0, 61.0, 78.0, 150.0, 245.0, 428.0, 736.0, 801.0, 655.0, 317.0, 193.0, 119.0, 58.0, 48.0, 22.0, 19.0, 12.0, 7.0, 9.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.985260009765625, -1.92559814453125, -1.865936279296875, -1.8062744140625, -1.746612548828125, -1.68695068359375, -1.627288818359375, -1.567626953125, -1.507965087890625, -1.44830322265625, -1.388641357421875, -1.3289794921875, -1.269317626953125, -1.20965576171875, -1.149993896484375, -1.09033203125, -1.030670166015625, -0.97100830078125, -0.911346435546875, -0.8516845703125, -0.792022705078125, -0.73236083984375, -0.672698974609375, -0.613037109375, -0.553375244140625, -0.49371337890625, -0.434051513671875, -0.3743896484375, -0.314727783203125, -0.25506591796875, -0.195404052734375, -0.1357421875, -0.076080322265625, -0.01641845703125, 0.043243408203125, 0.1029052734375, 0.162567138671875, 0.22222900390625, 0.281890869140625, 0.341552734375, 0.401214599609375, 0.46087646484375, 0.520538330078125, 0.5802001953125, 0.639862060546875, 0.69952392578125, 0.759185791015625, 0.81884765625, 0.878509521484375, 0.93817138671875, 0.997833251953125, 1.0574951171875, 1.117156982421875, 1.17681884765625, 1.236480712890625, 1.296142578125, 1.355804443359375, 1.41546630859375, 1.475128173828125, 1.5347900390625, 1.594451904296875, 1.65411376953125, 1.713775634765625, 1.7734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 11.0, 19.0, 26.0, 41.0, 55.0, 59.0, 63.0, 81.0, 84.0, 97.0, 89.0, 71.0, 62.0, 44.0, 49.0, 33.0, 19.0, 32.0, 20.0, 6.0, 11.0, 10.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8258464336395264, -2.6834685802459717, -2.541090965270996, -2.3987131118774414, -2.256335496902466, -2.113957643508911, -1.971579909324646, -1.8292021751403809, -1.6868244409561157, -1.5444467067718506, -1.4020689725875854, -1.2596912384033203, -1.1173133850097656, -0.9749357104301453, -0.8325579166412354, -0.6901801824569702, -0.5478024482727051, -0.40542471408843994, -0.2630469501018524, -0.12066918611526489, 0.021708548069000244, 0.16408628225326538, 0.3064640760421753, 0.44884181022644043, 0.5912195444107056, 0.7335972785949707, 0.8759750127792358, 1.018352746963501, 1.1607306003570557, 1.3031082153320312, 1.445486068725586, 1.587863802909851, 1.730241298675537, 1.8726190328598022, 2.0149967670440674, 2.157374620437622, 2.2997522354125977, 2.4421300888061523, 2.584507942199707, 2.7268855571746826, 2.869263172149658, 3.011641025543213, 3.1540186405181885, 3.296396493911743, 3.4387741088867188, 3.5811519622802734, 3.723529815673828, 3.8659074306488037, 4.0082855224609375, 4.150663375854492, 4.293041229248047, 4.435418605804443, 4.577796459197998, 4.720174312591553, 4.862552165985107, 5.004929542541504, 5.147307395935059, 5.289685249328613, 5.432063102722168, 5.5744404792785645, 5.716818332672119, 5.859196186065674, 6.0015740394592285, 6.143951416015625, 6.28632926940918]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 1.0, 5.0, 6.0, 8.0, 5.0, 15.0, 16.0, 14.0, 24.0, 24.0, 31.0, 19.0, 27.0, 40.0, 42.0, 47.0, 54.0, 41.0, 43.0, 42.0, 44.0, 29.0, 50.0, 50.0, 43.0, 47.0, 36.0, 26.0, 37.0, 24.0, 22.0, 13.0, 15.0, 19.0, 8.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8028488159179688, -2.707266330718994, -2.6116836071014404, -2.5161008834838867, -2.420518398284912, -2.3249359130859375, -2.229353189468384, -2.13377046585083, -2.0381879806518555, -1.9426053762435913, -1.8470227718353271, -1.751440167427063, -1.6558575630187988, -1.5602749586105347, -1.4646923542022705, -1.3691097497940063, -1.2735271453857422, -1.177944540977478, -1.0823619365692139, -0.9867793321609497, -0.8911967277526855, -0.7956141233444214, -0.7000315189361572, -0.6044489145278931, -0.5088663101196289, -0.41328370571136475, -0.3177011013031006, -0.22211849689483643, -0.12653589248657227, -0.030953288078308105, 0.06462931632995605, 0.16021192073822021, 0.2557945251464844, 0.35137712955474854, 0.4469597339630127, 0.5425423383712769, 0.638124942779541, 0.7337075471878052, 0.8292901515960693, 0.9248727560043335, 1.0204553604125977, 1.1160379648208618, 1.211620569229126, 1.3072031736373901, 1.4027857780456543, 1.4983683824539185, 1.5939509868621826, 1.6895335912704468, 1.785116195678711, 1.880698800086975, 1.9762814044952393, 2.071864128112793, 2.1674466133117676, 2.263029098510742, 2.358611822128296, 2.4541945457458496, 2.549777030944824, 2.645359516143799, 2.7409422397613525, 2.8365249633789062, 2.932107448577881, 3.0276899337768555, 3.123272657394409, 3.218855381011963, 3.3144378662109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 15.0, 12.0, 18.0, 46.0, 58.0, 77.0, 125.0, 167.0, 264.0, 407.0, 706.0, 1193.0, 2207.0, 4014.0, 8242.0, 20164.0, 75075.0, 355398.0, 434058.0, 101656.0, 24751.0, 9379.0, 4552.0, 2496.0, 1369.0, 787.0, 458.0, 308.0, 178.0, 105.0, 70.0, 51.0, 35.0, 26.0, 21.0, 12.0, 9.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0703125, -1.0379714965820312, -1.0056304931640625, -0.9732894897460938, -0.940948486328125, -0.9086074829101562, -0.8762664794921875, -0.8439254760742188, -0.81158447265625, -0.7792434692382812, -0.7469024658203125, -0.7145614624023438, -0.682220458984375, -0.6498794555664062, -0.6175384521484375, -0.5851974487304688, -0.5528564453125, -0.5205154418945312, -0.4881744384765625, -0.45583343505859375, -0.423492431640625, -0.39115142822265625, -0.3588104248046875, -0.32646942138671875, -0.29412841796875, -0.26178741455078125, -0.2294464111328125, -0.19710540771484375, -0.164764404296875, -0.13242340087890625, -0.1000823974609375, -0.06774139404296875, -0.035400390625, -0.00305938720703125, 0.0292816162109375, 0.06162261962890625, 0.093963623046875, 0.12630462646484375, 0.1586456298828125, 0.19098663330078125, 0.22332763671875, 0.25566864013671875, 0.2880096435546875, 0.32035064697265625, 0.352691650390625, 0.38503265380859375, 0.4173736572265625, 0.44971466064453125, 0.4820556640625, 0.5143966674804688, 0.5467376708984375, 0.5790786743164062, 0.611419677734375, 0.6437606811523438, 0.6761016845703125, 0.7084426879882812, 0.74078369140625, 0.7731246948242188, 0.8054656982421875, 0.8378067016601562, 0.870147705078125, 0.9024887084960938, 0.9348297119140625, 0.9671707153320312, 0.99951171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 9.0, 4.0, 8.0, 14.0, 13.0, 19.0, 19.0, 25.0, 28.0, 23.0, 34.0, 36.0, 47.0, 46.0, 52.0, 56.0, 43.0, 50.0, 37.0, 50.0, 54.0, 44.0, 32.0, 39.0, 41.0, 25.0, 30.0, 19.0, 17.0, 15.0, 21.0, 11.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.96484375, -1.902099609375, -1.83935546875, -1.776611328125, -1.7138671875, -1.651123046875, -1.58837890625, -1.525634765625, -1.462890625, -1.400146484375, -1.33740234375, -1.274658203125, -1.2119140625, -1.149169921875, -1.08642578125, -1.023681640625, -0.9609375, -0.898193359375, -0.83544921875, -0.772705078125, -0.7099609375, -0.647216796875, -0.58447265625, -0.521728515625, -0.458984375, -0.396240234375, -0.33349609375, -0.270751953125, -0.2080078125, -0.145263671875, -0.08251953125, -0.019775390625, 0.04296875, 0.105712890625, 0.16845703125, 0.231201171875, 0.2939453125, 0.356689453125, 0.41943359375, 0.482177734375, 0.544921875, 0.607666015625, 0.67041015625, 0.733154296875, 0.7958984375, 0.858642578125, 0.92138671875, 0.984130859375, 1.046875, 1.109619140625, 1.17236328125, 1.235107421875, 1.2978515625, 1.360595703125, 1.42333984375, 1.486083984375, 1.548828125, 1.611572265625, 1.67431640625, 1.737060546875, 1.7998046875, 1.862548828125, 1.92529296875, 1.988037109375, 2.05078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 10.0, 7.0, 21.0, 19.0, 39.0, 71.0, 110.0, 191.0, 422.0, 835.0, 1961.0, 5555.0, 19679.0, 147287.0, 694384.0, 148331.0, 20322.0, 5537.0, 1974.0, 829.0, 448.0, 222.0, 93.0, 64.0, 43.0, 18.0, 11.0, 10.0, 5.0, 7.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.6845703125, -1.637115478515625, -1.58966064453125, -1.542205810546875, -1.4947509765625, -1.447296142578125, -1.39984130859375, -1.352386474609375, -1.304931640625, -1.257476806640625, -1.21002197265625, -1.162567138671875, -1.1151123046875, -1.067657470703125, -1.02020263671875, -0.972747802734375, -0.92529296875, -0.877838134765625, -0.83038330078125, -0.782928466796875, -0.7354736328125, -0.688018798828125, -0.64056396484375, -0.593109130859375, -0.545654296875, -0.498199462890625, -0.45074462890625, -0.403289794921875, -0.3558349609375, -0.308380126953125, -0.26092529296875, -0.213470458984375, -0.166015625, -0.118560791015625, -0.07110595703125, -0.023651123046875, 0.0238037109375, 0.071258544921875, 0.11871337890625, 0.166168212890625, 0.213623046875, 0.261077880859375, 0.30853271484375, 0.355987548828125, 0.4034423828125, 0.450897216796875, 0.49835205078125, 0.545806884765625, 0.59326171875, 0.640716552734375, 0.68817138671875, 0.735626220703125, 0.7830810546875, 0.830535888671875, 0.87799072265625, 0.925445556640625, 0.972900390625, 1.020355224609375, 1.06781005859375, 1.115264892578125, 1.1627197265625, 1.210174560546875, 1.25762939453125, 1.305084228515625, 1.3525390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 7.0, 8.0, 6.0, 8.0, 12.0, 22.0, 18.0, 26.0, 20.0, 14.0, 34.0, 37.0, 40.0, 36.0, 49.0, 50.0, 39.0, 46.0, 45.0, 52.0, 53.0, 53.0, 40.0, 37.0, 43.0, 27.0, 30.0, 31.0, 16.0, 15.0, 13.0, 12.0, 11.0, 5.0, 6.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.921875, -4.77215576171875, -4.6224365234375, -4.47271728515625, -4.322998046875, -4.17327880859375, -4.0235595703125, -3.87384033203125, -3.72412109375, -3.57440185546875, -3.4246826171875, -3.27496337890625, -3.125244140625, -2.97552490234375, -2.8258056640625, -2.67608642578125, -2.5263671875, -2.37664794921875, -2.2269287109375, -2.07720947265625, -1.927490234375, -1.77777099609375, -1.6280517578125, -1.47833251953125, -1.32861328125, -1.17889404296875, -1.0291748046875, -0.87945556640625, -0.729736328125, -0.58001708984375, -0.4302978515625, -0.28057861328125, -0.130859375, 0.01885986328125, 0.1685791015625, 0.31829833984375, 0.468017578125, 0.61773681640625, 0.7674560546875, 0.91717529296875, 1.06689453125, 1.21661376953125, 1.3663330078125, 1.51605224609375, 1.665771484375, 1.81549072265625, 1.9652099609375, 2.11492919921875, 2.2646484375, 2.41436767578125, 2.5640869140625, 2.71380615234375, 2.863525390625, 3.01324462890625, 3.1629638671875, 3.31268310546875, 3.46240234375, 3.61212158203125, 3.7618408203125, 3.91156005859375, 4.061279296875, 4.21099853515625, 4.3607177734375, 4.51043701171875, 4.66015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 13.0, 12.0, 45.0, 71.0, 141.0, 343.0, 794.0, 2727.0, 13122.0, 274261.0, 722880.0, 27859.0, 4250.0, 1211.0, 440.0, 194.0, 82.0, 47.0, 32.0, 16.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5498046875, -1.5081024169921875, -1.466400146484375, -1.4246978759765625, -1.38299560546875, -1.3412933349609375, -1.299591064453125, -1.2578887939453125, -1.2161865234375, -1.1744842529296875, -1.132781982421875, -1.0910797119140625, -1.04937744140625, -1.0076751708984375, -0.965972900390625, -0.9242706298828125, -0.882568359375, -0.8408660888671875, -0.799163818359375, -0.7574615478515625, -0.71575927734375, -0.6740570068359375, -0.632354736328125, -0.5906524658203125, -0.5489501953125, -0.5072479248046875, -0.465545654296875, -0.4238433837890625, -0.38214111328125, -0.3404388427734375, -0.298736572265625, -0.2570343017578125, -0.21533203125, -0.1736297607421875, -0.131927490234375, -0.0902252197265625, -0.04852294921875, -0.0068206787109375, 0.034881591796875, 0.0765838623046875, 0.1182861328125, 0.1599884033203125, 0.201690673828125, 0.2433929443359375, 0.28509521484375, 0.3267974853515625, 0.368499755859375, 0.4102020263671875, 0.451904296875, 0.4936065673828125, 0.535308837890625, 0.5770111083984375, 0.61871337890625, 0.6604156494140625, 0.702117919921875, 0.7438201904296875, 0.7855224609375, 0.8272247314453125, 0.868927001953125, 0.9106292724609375, 0.95233154296875, 0.9940338134765625, 1.035736083984375, 1.0774383544921875, 1.119140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 16.0, 16.0, 32.0, 48.0, 90.0, 135.0, 175.0, 152.0, 140.0, 81.0, 49.0, 22.0, 19.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005588531494140625, -0.0005445331335067749, -0.0005302131175994873, -0.0005158931016921997, -0.0005015730857849121, -0.0004872530698776245, -0.0004729330539703369, -0.0004586130380630493, -0.0004442930221557617, -0.0004299730062484741, -0.0004156529903411865, -0.0004013329744338989, -0.00038701295852661133, -0.00037269294261932373, -0.00035837292671203613, -0.00034405291080474854, -0.00032973289489746094, -0.00031541287899017334, -0.00030109286308288574, -0.00028677284717559814, -0.00027245283126831055, -0.00025813281536102295, -0.00024381279945373535, -0.00022949278354644775, -0.00021517276763916016, -0.00020085275173187256, -0.00018653273582458496, -0.00017221271991729736, -0.00015789270401000977, -0.00014357268810272217, -0.00012925267219543457, -0.00011493265628814697, -0.00010061264038085938, -8.629262447357178e-05, -7.197260856628418e-05, -5.765259265899658e-05, -4.3332576751708984e-05, -2.9012560844421387e-05, -1.4692544937133789e-05, -3.725290298461914e-07, 1.3947486877441406e-05, 2.8267502784729004e-05, 4.25875186920166e-05, 5.69075345993042e-05, 7.12275505065918e-05, 8.55475664138794e-05, 9.986758232116699e-05, 0.00011418759822845459, 0.0001285076141357422, 0.00014282763004302979, 0.00015714764595031738, 0.00017146766185760498, 0.00018578767776489258, 0.00020010769367218018, 0.00021442770957946777, 0.00022874772548675537, 0.00024306774139404297, 0.00025738775730133057, 0.00027170777320861816, 0.00028602778911590576, 0.00030034780502319336, 0.00031466782093048096, 0.00032898783683776855, 0.00034330785274505615, 0.00035762786865234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 10.0, 5.0, 12.0, 15.0, 30.0, 31.0, 43.0, 50.0, 84.0, 107.0, 172.0, 213.0, 335.0, 514.0, 799.0, 1209.0, 2164.0, 3709.0, 7454.0, 15042.0, 34700.0, 88371.0, 230465.0, 348954.0, 188121.0, 71402.0, 28118.0, 12290.0, 5907.0, 3066.0, 1813.0, 1114.0, 715.0, 483.0, 278.0, 196.0, 159.0, 95.0, 66.0, 51.0, 41.0, 37.0, 29.0, 23.0, 12.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0], "bins": [-0.38232421875, -0.37087249755859375, -0.3594207763671875, -0.34796905517578125, -0.336517333984375, -0.32506561279296875, -0.3136138916015625, -0.30216217041015625, -0.29071044921875, -0.27925872802734375, -0.2678070068359375, -0.25635528564453125, -0.244903564453125, -0.23345184326171875, -0.2220001220703125, -0.21054840087890625, -0.1990966796875, -0.18764495849609375, -0.1761932373046875, -0.16474151611328125, -0.153289794921875, -0.14183807373046875, -0.1303863525390625, -0.11893463134765625, -0.10748291015625, -0.09603118896484375, -0.0845794677734375, -0.07312774658203125, -0.061676025390625, -0.05022430419921875, -0.0387725830078125, -0.02732086181640625, -0.015869140625, -0.00441741943359375, 0.0070343017578125, 0.01848602294921875, 0.029937744140625, 0.04138946533203125, 0.0528411865234375, 0.06429290771484375, 0.07574462890625, 0.08719635009765625, 0.0986480712890625, 0.11009979248046875, 0.121551513671875, 0.13300323486328125, 0.1444549560546875, 0.15590667724609375, 0.1673583984375, 0.17881011962890625, 0.1902618408203125, 0.20171356201171875, 0.213165283203125, 0.22461700439453125, 0.2360687255859375, 0.24752044677734375, 0.25897216796875, 0.27042388916015625, 0.2818756103515625, 0.29332733154296875, 0.304779052734375, 0.31623077392578125, 0.3276824951171875, 0.33913421630859375, 0.3505859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 7.0, 4.0, 16.0, 21.0, 22.0, 33.0, 44.0, 64.0, 78.0, 88.0, 101.0, 116.0, 107.0, 68.0, 70.0, 38.0, 36.0, 23.0, 14.0, 11.0, 10.0, 4.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185546875, -0.1793537139892578, -0.17316055297851562, -0.16696739196777344, -0.16077423095703125, -0.15458106994628906, -0.14838790893554688, -0.1421947479248047, -0.1360015869140625, -0.1298084259033203, -0.12361526489257812, -0.11742210388183594, -0.11122894287109375, -0.10503578186035156, -0.09884262084960938, -0.09264945983886719, -0.086456298828125, -0.08026313781738281, -0.07406997680664062, -0.06787681579589844, -0.06168365478515625, -0.05549049377441406, -0.049297332763671875, -0.04310417175292969, -0.0369110107421875, -0.030717849731445312, -0.024524688720703125, -0.018331527709960938, -0.01213836669921875, -0.0059452056884765625, 0.000247955322265625, 0.0064411163330078125, 0.01263427734375, 0.018827438354492188, 0.025020599365234375, 0.031213760375976562, 0.03740692138671875, 0.04360008239746094, 0.049793243408203125, 0.05598640441894531, 0.0621795654296875, 0.06837272644042969, 0.07456588745117188, 0.08075904846191406, 0.08695220947265625, 0.09314537048339844, 0.09933853149414062, 0.10553169250488281, 0.111724853515625, 0.11791801452636719, 0.12411117553710938, 0.13030433654785156, 0.13649749755859375, 0.14269065856933594, 0.14888381958007812, 0.1550769805908203, 0.1612701416015625, 0.1674633026123047, 0.17365646362304688, 0.17984962463378906, 0.18604278564453125, 0.19223594665527344, 0.19842910766601562, 0.2046222686767578, 0.2108154296875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 9.0, 13.0, 17.0, 23.0, 38.0, 44.0, 56.0, 70.0, 85.0, 79.0, 85.0, 86.0, 83.0, 52.0, 52.0, 49.0, 30.0, 27.0, 18.0, 16.0, 17.0, 5.0, 14.0, 3.0, 7.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029763698577881, -1.9478716850280762, -1.8659796714782715, -1.7840876579284668, -1.702195644378662, -1.6203036308288574, -1.5384116172790527, -1.456519603729248, -1.3746275901794434, -1.2927355766296387, -1.210843563079834, -1.1289515495300293, -1.0470595359802246, -0.9651675224304199, -0.8832755088806152, -0.8013834953308105, -0.7194914817810059, -0.6375994682312012, -0.5557074546813965, -0.4738154411315918, -0.3919234275817871, -0.3100314140319824, -0.22813940048217773, -0.14624738693237305, -0.06435537338256836, 0.017536640167236328, 0.09942865371704102, 0.1813206672668457, 0.2632126808166504, 0.3451046943664551, 0.42699670791625977, 0.5088887214660645, 0.5907809734344482, 0.6726729869842529, 0.7545650005340576, 0.8364570140838623, 0.918349027633667, 1.0002410411834717, 1.0821330547332764, 1.164025068283081, 1.2459170818328857, 1.3278090953826904, 1.4097011089324951, 1.4915931224822998, 1.5734851360321045, 1.6553771495819092, 1.7372691631317139, 1.8191611766815186, 1.9010531902313232, 1.982945203781128, 2.0648372173309326, 2.1467292308807373, 2.228621244430542, 2.3105132579803467, 2.3924052715301514, 2.474297285079956, 2.5561892986297607, 2.6380813121795654, 2.71997332572937, 2.801865339279175, 2.8837573528289795, 2.965649366378784, 3.047541379928589, 3.1294333934783936, 3.2113254070281982]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 8.0, 5.0, 7.0, 10.0, 10.0, 22.0, 18.0, 21.0, 27.0, 30.0, 21.0, 35.0, 42.0, 45.0, 38.0, 44.0, 38.0, 42.0, 52.0, 28.0, 40.0, 52.0, 38.0, 33.0, 32.0, 44.0, 28.0, 23.0, 31.0, 28.0, 11.0, 22.0, 13.0, 6.0, 11.0, 8.0, 7.0, 8.0, 7.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5782090425491333, -1.5229995250701904, -1.4677900075912476, -1.4125804901123047, -1.3573710918426514, -1.3021615743637085, -1.2469520568847656, -1.1917425394058228, -1.1365330219268799, -1.081323504447937, -1.0261139869689941, -0.970904529094696, -0.915695071220398, -0.8604855537414551, -0.8052760362625122, -0.7500665187835693, -0.694857120513916, -0.6396476030349731, -0.584438145160675, -0.5292286276817322, -0.4740191400051117, -0.4188096523284912, -0.36360013484954834, -0.30839064717292786, -0.2531811594963074, -0.1979716718196869, -0.1427621692419052, -0.08755266666412354, -0.03234317898750305, 0.02286630868911743, 0.0780758261680603, 0.1332853138446808, 0.18849468231201172, 0.2437041699886322, 0.2989136576652527, 0.35412317514419556, 0.40933266282081604, 0.4645421504974365, 0.5197516679763794, 0.5749611854553223, 0.6301706433296204, 0.6853801608085632, 0.7405896186828613, 0.7957991361618042, 0.8510086536407471, 0.9062181115150452, 0.961427628993988, 1.0166370868682861, 1.071846604347229, 1.1270561218261719, 1.1822656393051147, 1.2374751567840576, 1.292684555053711, 1.3478940725326538, 1.4031035900115967, 1.4583131074905396, 1.5135226249694824, 1.5687321424484253, 1.6239416599273682, 1.6791510581970215, 1.7343605756759644, 1.7895700931549072, 1.84477961063385, 1.899989128112793, 1.9551985263824463]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 5.0, 6.0, 7.0, 12.0, 20.0, 34.0, 42.0, 54.0, 86.0, 138.0, 200.0, 369.0, 699.0, 1316.0, 2670.0, 5867.0, 13411.0, 32577.0, 87471.0, 294361.0, 413303.0, 120741.0, 43414.0, 17387.0, 7486.0, 3325.0, 1635.0, 812.0, 442.0, 221.0, 134.0, 97.0, 67.0, 34.0, 34.0, 10.0, 21.0, 6.0, 8.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.875946044921875, -2.77728271484375, -2.678619384765625, -2.5799560546875, -2.481292724609375, -2.38262939453125, -2.283966064453125, -2.185302734375, -2.086639404296875, -1.98797607421875, -1.889312744140625, -1.7906494140625, -1.691986083984375, -1.59332275390625, -1.494659423828125, -1.39599609375, -1.297332763671875, -1.19866943359375, -1.100006103515625, -1.0013427734375, -0.902679443359375, -0.80401611328125, -0.705352783203125, -0.606689453125, -0.508026123046875, -0.40936279296875, -0.310699462890625, -0.2120361328125, -0.113372802734375, -0.01470947265625, 0.083953857421875, 0.1826171875, 0.281280517578125, 0.37994384765625, 0.478607177734375, 0.5772705078125, 0.675933837890625, 0.77459716796875, 0.873260498046875, 0.971923828125, 1.070587158203125, 1.16925048828125, 1.267913818359375, 1.3665771484375, 1.465240478515625, 1.56390380859375, 1.662567138671875, 1.76123046875, 1.859893798828125, 1.95855712890625, 2.057220458984375, 2.1558837890625, 2.254547119140625, 2.35321044921875, 2.451873779296875, 2.550537109375, 2.649200439453125, 2.74786376953125, 2.846527099609375, 2.9451904296875, 3.043853759765625, 3.14251708984375, 3.241180419921875, 3.33984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 1.0, 5.0, 4.0, 5.0, 10.0, 11.0, 8.0, 15.0, 22.0, 13.0, 26.0, 25.0, 43.0, 31.0, 25.0, 40.0, 39.0, 46.0, 44.0, 50.0, 43.0, 42.0, 45.0, 40.0, 39.0, 36.0, 36.0, 32.0, 31.0, 26.0, 29.0, 29.0, 22.0, 15.0, 16.0, 18.0, 3.0, 7.0, 10.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.072265625, -2.97308349609375, -2.8739013671875, -2.77471923828125, -2.675537109375, -2.57635498046875, -2.4771728515625, -2.37799072265625, -2.27880859375, -2.17962646484375, -2.0804443359375, -1.98126220703125, -1.882080078125, -1.78289794921875, -1.6837158203125, -1.58453369140625, -1.4853515625, -1.38616943359375, -1.2869873046875, -1.18780517578125, -1.088623046875, -0.98944091796875, -0.8902587890625, -0.79107666015625, -0.69189453125, -0.59271240234375, -0.4935302734375, -0.39434814453125, -0.295166015625, -0.19598388671875, -0.0968017578125, 0.00238037109375, 0.1015625, 0.20074462890625, 0.2999267578125, 0.39910888671875, 0.498291015625, 0.59747314453125, 0.6966552734375, 0.79583740234375, 0.89501953125, 0.99420166015625, 1.0933837890625, 1.19256591796875, 1.291748046875, 1.39093017578125, 1.4901123046875, 1.58929443359375, 1.6884765625, 1.78765869140625, 1.8868408203125, 1.98602294921875, 2.085205078125, 2.18438720703125, 2.2835693359375, 2.38275146484375, 2.48193359375, 2.58111572265625, 2.6802978515625, 2.77947998046875, 2.878662109375, 2.97784423828125, 3.0770263671875, 3.17620849609375, 3.275390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 7.0, 15.0, 24.0, 28.0, 29.0, 48.0, 86.0, 110.0, 187.0, 315.0, 608.0, 1382.0, 3259.0, 8458.0, 23785.0, 74124.0, 286278.0, 466461.0, 124995.0, 36844.0, 12853.0, 4798.0, 1902.0, 853.0, 399.0, 244.0, 153.0, 75.0, 66.0, 41.0, 25.0, 22.0, 15.0, 13.0, 9.0, 11.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.689453125, -3.57489013671875, -3.4603271484375, -3.34576416015625, -3.231201171875, -3.11663818359375, -3.0020751953125, -2.88751220703125, -2.77294921875, -2.65838623046875, -2.5438232421875, -2.42926025390625, -2.314697265625, -2.20013427734375, -2.0855712890625, -1.97100830078125, -1.8564453125, -1.74188232421875, -1.6273193359375, -1.51275634765625, -1.398193359375, -1.28363037109375, -1.1690673828125, -1.05450439453125, -0.93994140625, -0.82537841796875, -0.7108154296875, -0.59625244140625, -0.481689453125, -0.36712646484375, -0.2525634765625, -0.13800048828125, -0.0234375, 0.09112548828125, 0.2056884765625, 0.32025146484375, 0.434814453125, 0.54937744140625, 0.6639404296875, 0.77850341796875, 0.89306640625, 1.00762939453125, 1.1221923828125, 1.23675537109375, 1.351318359375, 1.46588134765625, 1.5804443359375, 1.69500732421875, 1.8095703125, 1.92413330078125, 2.0386962890625, 2.15325927734375, 2.267822265625, 2.38238525390625, 2.4969482421875, 2.61151123046875, 2.72607421875, 2.84063720703125, 2.9552001953125, 3.06976318359375, 3.184326171875, 3.29888916015625, 3.4134521484375, 3.52801513671875, 3.642578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 10.0, 11.0, 16.0, 9.0, 23.0, 20.0, 31.0, 28.0, 28.0, 45.0, 38.0, 39.0, 53.0, 36.0, 63.0, 57.0, 52.0, 48.0, 46.0, 45.0, 36.0, 43.0, 44.0, 24.0, 25.0, 16.0, 15.0, 14.0, 15.0, 8.0, 7.0, 11.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.52734375, -4.39605712890625, -4.2647705078125, -4.13348388671875, -4.002197265625, -3.87091064453125, -3.7396240234375, -3.60833740234375, -3.47705078125, -3.34576416015625, -3.2144775390625, -3.08319091796875, -2.951904296875, -2.82061767578125, -2.6893310546875, -2.55804443359375, -2.4267578125, -2.29547119140625, -2.1641845703125, -2.03289794921875, -1.901611328125, -1.77032470703125, -1.6390380859375, -1.50775146484375, -1.37646484375, -1.24517822265625, -1.1138916015625, -0.98260498046875, -0.851318359375, -0.72003173828125, -0.5887451171875, -0.45745849609375, -0.326171875, -0.19488525390625, -0.0635986328125, 0.06768798828125, 0.198974609375, 0.33026123046875, 0.4615478515625, 0.59283447265625, 0.72412109375, 0.85540771484375, 0.9866943359375, 1.11798095703125, 1.249267578125, 1.38055419921875, 1.5118408203125, 1.64312744140625, 1.7744140625, 1.90570068359375, 2.0369873046875, 2.16827392578125, 2.299560546875, 2.43084716796875, 2.5621337890625, 2.69342041015625, 2.82470703125, 2.95599365234375, 3.0872802734375, 3.21856689453125, 3.349853515625, 3.48114013671875, 3.6124267578125, 3.74371337890625, 3.875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 21.0, 24.0, 30.0, 51.0, 68.0, 102.0, 145.0, 247.0, 362.0, 668.0, 1035.0, 1972.0, 3808.0, 7417.0, 14932.0, 32873.0, 81396.0, 221369.0, 406505.0, 163429.0, 61023.0, 25852.0, 12088.0, 6050.0, 3123.0, 1600.0, 915.0, 516.0, 291.0, 205.0, 132.0, 73.0, 66.0, 39.0, 33.0, 19.0, 13.0, 16.0, 3.0, 5.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.5044174194335938, -0.4883270263671875, -0.47223663330078125, -0.456146240234375, -0.44005584716796875, -0.4239654541015625, -0.40787506103515625, -0.39178466796875, -0.37569427490234375, -0.3596038818359375, -0.34351348876953125, -0.327423095703125, -0.31133270263671875, -0.2952423095703125, -0.27915191650390625, -0.2630615234375, -0.24697113037109375, -0.2308807373046875, -0.21479034423828125, -0.198699951171875, -0.18260955810546875, -0.1665191650390625, -0.15042877197265625, -0.13433837890625, -0.11824798583984375, -0.1021575927734375, -0.08606719970703125, -0.069976806640625, -0.05388641357421875, -0.0377960205078125, -0.02170562744140625, -0.005615234375, 0.01047515869140625, 0.0265655517578125, 0.04265594482421875, 0.058746337890625, 0.07483673095703125, 0.0909271240234375, 0.10701751708984375, 0.12310791015625, 0.13919830322265625, 0.1552886962890625, 0.17137908935546875, 0.187469482421875, 0.20355987548828125, 0.2196502685546875, 0.23574066162109375, 0.2518310546875, 0.26792144775390625, 0.2840118408203125, 0.30010223388671875, 0.316192626953125, 0.33228302001953125, 0.3483734130859375, 0.36446380615234375, 0.38055419921875, 0.39664459228515625, 0.4127349853515625, 0.42882537841796875, 0.444915771484375, 0.46100616455078125, 0.4770965576171875, 0.49318695068359375, 0.50927734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 11.0, 16.0, 12.0, 21.0, 24.0, 38.0, 38.0, 47.0, 54.0, 62.0, 89.0, 93.0, 91.0, 61.0, 61.0, 50.0, 40.0, 38.0, 31.0, 20.0, 18.0, 16.0, 7.0, 10.0, 5.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00014019012451171875, -0.0001363418996334076, -0.00013249367475509644, -0.00012864544987678528, -0.00012479722499847412, -0.00012094900012016296, -0.0001171007752418518, -0.00011325255036354065, -0.00010940432548522949, -0.00010555610060691833, -0.00010170787572860718, -9.785965085029602e-05, -9.401142597198486e-05, -9.01632010936737e-05, -8.631497621536255e-05, -8.246675133705139e-05, -7.861852645874023e-05, -7.477030158042908e-05, -7.092207670211792e-05, -6.707385182380676e-05, -6.32256269454956e-05, -5.937740206718445e-05, -5.552917718887329e-05, -5.1680952310562134e-05, -4.7832727432250977e-05, -4.398450255393982e-05, -4.013627767562866e-05, -3.6288052797317505e-05, -3.243982791900635e-05, -2.859160304069519e-05, -2.4743378162384033e-05, -2.0895153284072876e-05, -1.704692840576172e-05, -1.3198703527450562e-05, -9.350478649139404e-06, -5.502253770828247e-06, -1.6540288925170898e-06, 2.1941959857940674e-06, 6.042420864105225e-06, 9.890645742416382e-06, 1.3738870620727539e-05, 1.7587095499038696e-05, 2.1435320377349854e-05, 2.528354525566101e-05, 2.9131770133972168e-05, 3.2979995012283325e-05, 3.682821989059448e-05, 4.067644476890564e-05, 4.45246696472168e-05, 4.8372894525527954e-05, 5.222111940383911e-05, 5.606934428215027e-05, 5.9917569160461426e-05, 6.376579403877258e-05, 6.761401891708374e-05, 7.14622437953949e-05, 7.531046867370605e-05, 7.915869355201721e-05, 8.300691843032837e-05, 8.685514330863953e-05, 9.070336818695068e-05, 9.455159306526184e-05, 9.8399817943573e-05, 0.00010224804282188416, 0.00010609626770019531]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 6.0, 11.0, 9.0, 14.0, 14.0, 27.0, 31.0, 31.0, 67.0, 78.0, 111.0, 141.0, 242.0, 336.0, 528.0, 972.0, 1640.0, 2960.0, 6051.0, 13379.0, 32574.0, 91542.0, 304071.0, 404844.0, 117458.0, 39958.0, 16041.0, 7228.0, 3425.0, 1812.0, 1022.0, 626.0, 428.0, 280.0, 170.0, 115.0, 81.0, 63.0, 52.0, 24.0, 24.0, 21.0, 12.0, 11.0, 8.0, 8.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.78857421875, -0.7647552490234375, -0.740936279296875, -0.7171173095703125, -0.69329833984375, -0.6694793701171875, -0.645660400390625, -0.6218414306640625, -0.5980224609375, -0.5742034912109375, -0.550384521484375, -0.5265655517578125, -0.50274658203125, -0.4789276123046875, -0.455108642578125, -0.4312896728515625, -0.407470703125, -0.3836517333984375, -0.359832763671875, -0.3360137939453125, -0.31219482421875, -0.2883758544921875, -0.264556884765625, -0.2407379150390625, -0.2169189453125, -0.1930999755859375, -0.169281005859375, -0.1454620361328125, -0.12164306640625, -0.0978240966796875, -0.074005126953125, -0.0501861572265625, -0.0263671875, -0.0025482177734375, 0.021270751953125, 0.0450897216796875, 0.06890869140625, 0.0927276611328125, 0.116546630859375, 0.1403656005859375, 0.1641845703125, 0.1880035400390625, 0.211822509765625, 0.2356414794921875, 0.25946044921875, 0.2832794189453125, 0.307098388671875, 0.3309173583984375, 0.354736328125, 0.3785552978515625, 0.402374267578125, 0.4261932373046875, 0.45001220703125, 0.4738311767578125, 0.497650146484375, 0.5214691162109375, 0.5452880859375, 0.5691070556640625, 0.592926025390625, 0.6167449951171875, 0.64056396484375, 0.6643829345703125, 0.688201904296875, 0.7120208740234375, 0.73583984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 7.0, 15.0, 29.0, 36.0, 35.0, 55.0, 91.0, 118.0, 141.0, 119.0, 112.0, 73.0, 52.0, 20.0, 21.0, 20.0, 12.0, 5.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.75341796875, -0.7329635620117188, -0.7125091552734375, -0.6920547485351562, -0.671600341796875, -0.6511459350585938, -0.6306915283203125, -0.6102371215820312, -0.58978271484375, -0.5693283081054688, -0.5488739013671875, -0.5284194946289062, -0.507965087890625, -0.48751068115234375, -0.4670562744140625, -0.44660186767578125, -0.4261474609375, -0.40569305419921875, -0.3852386474609375, -0.36478424072265625, -0.344329833984375, -0.32387542724609375, -0.3034210205078125, -0.28296661376953125, -0.26251220703125, -0.24205780029296875, -0.2216033935546875, -0.20114898681640625, -0.180694580078125, -0.16024017333984375, -0.1397857666015625, -0.11933135986328125, -0.098876953125, -0.07842254638671875, -0.0579681396484375, -0.03751373291015625, -0.017059326171875, 0.00339508056640625, 0.0238494873046875, 0.04430389404296875, 0.06475830078125, 0.08521270751953125, 0.1056671142578125, 0.12612152099609375, 0.146575927734375, 0.16703033447265625, 0.1874847412109375, 0.20793914794921875, 0.2283935546875, 0.24884796142578125, 0.2693023681640625, 0.28975677490234375, 0.310211181640625, 0.33066558837890625, 0.3511199951171875, 0.37157440185546875, 0.39202880859375, 0.41248321533203125, 0.4329376220703125, 0.45339202880859375, 0.473846435546875, 0.49430084228515625, 0.5147552490234375, 0.5352096557617188, 0.5556640625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 19.0, 26.0, 61.0, 100.0, 151.0, 157.0, 174.0, 133.0, 75.0, 43.0, 26.0, 14.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6573333740234375, -7.322300910949707, -6.987267971038818, -6.652235507965088, -6.317202568054199, -5.982170104980469, -5.647137641906738, -5.312105178833008, -4.977072238922119, -4.642039775848389, -4.3070068359375, -3.9719743728637695, -3.63694167137146, -3.3019089698791504, -2.96687650680542, -2.6318438053131104, -2.296811103820801, -1.9617784023284912, -1.6267458200454712, -1.2917132377624512, -0.9566805362701416, -0.621647834777832, -0.28661537170410156, 0.04841732978820801, 0.3834500312805176, 0.7184826731681824, 1.0535153150558472, 1.3885478973388672, 1.7235805988311768, 2.0586133003234863, 2.393645763397217, 2.7286784648895264, 3.063711166381836, 3.3987438678741455, 3.733776569366455, 4.0688090324401855, 4.403841972351074, 4.738874435424805, 5.073906898498535, 5.408939361572266, 5.743972301483154, 6.079004764556885, 6.414037704467773, 6.749070167541504, 7.084102630615234, 7.419135570526123, 7.7541680335998535, 8.089200973510742, 8.424233436584473, 8.759265899658203, 9.094298362731934, 9.429330825805664, 9.764364242553711, 10.099396705627441, 10.434429168701172, 10.769461631774902, 11.104494094848633, 11.439526557922363, 11.774559020996094, 12.10959243774414, 12.444624900817871, 12.779657363891602, 13.114689826965332, 13.449722290039062, 13.78475570678711]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 2.0, 5.0, 5.0, 4.0, 10.0, 7.0, 16.0, 18.0, 15.0, 21.0, 26.0, 21.0, 29.0, 36.0, 28.0, 36.0, 23.0, 37.0, 39.0, 36.0, 32.0, 47.0, 37.0, 44.0, 42.0, 33.0, 27.0, 42.0, 32.0, 40.0, 27.0, 31.0, 16.0, 15.0, 27.0, 8.0, 18.0, 10.0, 11.0, 8.0, 13.0, 8.0, 2.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.685919284820557, -5.5085272789001465, -5.3311357498168945, -5.153743743896484, -4.976351737976074, -4.798959732055664, -4.621567726135254, -4.444176197052002, -4.266784191131592, -4.089392185211182, -3.9120004177093506, -3.7346086502075195, -3.5572166442871094, -3.379824638366699, -3.202432870864868, -3.025041103363037, -2.847649097442627, -2.670257091522217, -2.4928653240203857, -2.3154735565185547, -2.1380815505981445, -1.960689663887024, -1.7832977771759033, -1.6059058904647827, -1.428514003753662, -1.2511221170425415, -1.073730230331421, -0.8963383436203003, -0.7189464569091797, -0.5415545701980591, -0.3641626834869385, -0.18677079677581787, -0.009379386901855469, 0.16801249980926514, 0.34540438652038574, 0.5227962732315063, 0.700188159942627, 0.8775800466537476, 1.0549719333648682, 1.2323638200759888, 1.4097557067871094, 1.58714759349823, 1.7645394802093506, 1.9419313669204712, 2.119323253631592, 2.296715259552002, 2.474107027053833, 2.651498794555664, 2.828890800476074, 3.0062828063964844, 3.1836745738983154, 3.3610663414001465, 3.5384583473205566, 3.715850353240967, 3.893242120742798, 4.070633888244629, 4.248025894165039, 4.425417900085449, 4.602809906005859, 4.780201435089111, 4.9575934410095215, 5.134985446929932, 5.312376976013184, 5.489768981933594, 5.667160987854004]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 11.0, 13.0, 25.0, 15.0, 29.0, 38.0, 42.0, 65.0, 99.0, 81.0, 109.0, 144.0, 182.0, 226.0, 287.0, 382.0, 442.0, 549.0, 739.0, 1139.0, 1041031.0, 1250.0, 842.0, 567.0, 474.0, 383.0, 301.0, 235.0, 184.0, 165.0, 110.0, 91.0, 89.0, 66.0, 41.0, 32.0, 30.0, 17.0, 20.0, 18.0, 10.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.7618536949157715, -7.51632022857666, -7.270786285400391, -7.025252819061279, -6.779719352722168, -6.534185409545898, -6.288651943206787, -6.043118476867676, -5.7975850105285645, -5.552051544189453, -5.306517601013184, -5.060984134674072, -4.815450668334961, -4.569916725158691, -4.32438325881958, -4.078849792480469, -3.8333160877227783, -3.587782382965088, -3.3422489166259766, -3.096715211868286, -2.851181745529175, -2.6056480407714844, -2.360114574432373, -2.1145808696746826, -1.8690472841262817, -1.6235136985778809, -1.37798011302948, -1.132446527481079, -0.8869128823280334, -0.6413792371749878, -0.3958456516265869, -0.15031206607818604, 0.09522151947021484, 0.3407551050186157, 0.5862886905670166, 0.8318223357200623, 1.0773558616638184, 1.3228895664215088, 1.5684231519699097, 1.8139567375183105, 2.059490203857422, 2.3050239086151123, 2.5505573749542236, 2.796091079711914, 3.0416245460510254, 3.287158250808716, 3.5326919555664062, 3.7782254219055176, 4.023758888244629, 4.26929235458374, 4.51482629776001, 4.760359764099121, 5.005893230438232, 5.251426696777344, 5.496960639953613, 5.742494106292725, 5.988028049468994, 6.2335615158081055, 6.479095458984375, 6.724628925323486, 6.970162391662598, 7.215696334838867, 7.4612298011779785, 7.70676326751709, 7.952296733856201]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 4.0, 14.0, 24.0, 51.0, 88.0, 298.0, 876.0, 2495.0, 8633.0, 51432112.0, 19684.0, 4545.0, 1590.0, 566.0, 183.0, 83.0, 33.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.9190673828125, -64.31858825683594, -61.71810531616211, -59.11762237548828, -56.51714324951172, -53.91666030883789, -51.31617736816406, -48.7156982421875, -46.11521911621094, -43.51473617553711, -40.91425704956055, -38.31377410888672, -35.713294982910156, -33.11281204223633, -30.512331008911133, -27.911849975585938, -25.31136703491211, -22.710886001586914, -20.11040496826172, -17.50992202758789, -14.909441947937012, -12.308960914611816, -9.708478927612305, -7.107997894287109, -4.507516860961914, -1.9070355892181396, 0.6934456825256348, 3.2939271926879883, 5.894408226013184, 8.494889259338379, 11.09537124633789, 13.695852279663086, 16.29633331298828, 18.896814346313477, 21.497295379638672, 24.0977783203125, 26.698257446289062, 29.29874038696289, 31.899221420288086, 34.49970245361328, 37.100181579589844, 39.70066452026367, 42.301143646240234, 44.90162658691406, 47.502105712890625, 50.10258865356445, 52.70307159423828, 55.303550720214844, 57.90403366088867, 60.5045166015625, 63.10499572753906, 65.70547485351562, 68.30596160888672, 70.90644073486328, 73.50691986083984, 76.10740661621094, 78.7078857421875, 81.30836486816406, 83.90885162353516, 86.50933074951172, 89.10980987548828, 91.71028900146484, 94.31077575683594, 96.9112548828125, 99.51173400878906]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 8.0, 9.0, 14.0, 20.0, 32.0, 52.0, 104.0, 137.0, 257.0, 432.0, 797.0, 1439.0, 2847.0, 5296.0, 10457.0, 20563.0, 42282.0, 85533.0, 164565.0, 296450.0, 492685.0, 2642651.0, 1543378.0, 434078.0, 260250.0, 142409.0, 72752.0, 35519.0, 17572.0, 8801.0, 4545.0, 2382.0, 1298.0, 753.0, 389.0, 222.0, 154.0, 92.0, 56.0, 41.0, 23.0, 24.0, 13.0, 18.0, 12.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.515625, -5.32464599609375, -5.1336669921875, -4.94268798828125, -4.751708984375, -4.56072998046875, -4.3697509765625, -4.17877197265625, -3.98779296875, -3.79681396484375, -3.6058349609375, -3.41485595703125, -3.223876953125, -3.03289794921875, -2.8419189453125, -2.65093994140625, -2.4599609375, -2.26898193359375, -2.0780029296875, -1.88702392578125, -1.696044921875, -1.50506591796875, -1.3140869140625, -1.12310791015625, -0.93212890625, -0.74114990234375, -0.5501708984375, -0.35919189453125, -0.168212890625, 0.02276611328125, 0.2137451171875, 0.40472412109375, 0.595703125, 0.78668212890625, 0.9776611328125, 1.16864013671875, 1.359619140625, 1.55059814453125, 1.7415771484375, 1.93255615234375, 2.12353515625, 2.31451416015625, 2.5054931640625, 2.69647216796875, 2.887451171875, 3.07843017578125, 3.2694091796875, 3.46038818359375, 3.6513671875, 3.84234619140625, 4.0333251953125, 4.22430419921875, 4.415283203125, 4.60626220703125, 4.7972412109375, 4.98822021484375, 5.17919921875, 5.37017822265625, 5.5611572265625, 5.75213623046875, 5.943115234375, 6.13409423828125, 6.3250732421875, 6.51605224609375, 6.70703125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 18.0, 14.0, 18.0, 19.0, 16.0, 26.0, 24.0, 29.0, 28.0, 35.0, 36.0, 41.0, 43.0, 39.0, 66.0, 180.0, 700.0, 224.0, 61.0, 35.0, 40.0, 47.0, 36.0, 26.0, 35.0, 20.0, 21.0, 22.0, 15.0, 10.0, 13.0, 21.0, 9.0, 5.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.03125, -31.984375, -30.9375, -29.890625, -28.84375, -27.796875, -26.75, -25.703125, -24.65625, -23.609375, -22.5625, -21.515625, -20.46875, -19.421875, -18.375, -17.328125, -16.28125, -15.234375, -14.1875, -13.140625, -12.09375, -11.046875, -10.0, -8.953125, -7.90625, -6.859375, -5.8125, -4.765625, -3.71875, -2.671875, -1.625, -0.578125, 0.46875, 1.515625, 2.5625, 3.609375, 4.65625, 5.703125, 6.75, 7.796875, 8.84375, 9.890625, 10.9375, 11.984375, 13.03125, 14.078125, 15.125, 16.171875, 17.21875, 18.265625, 19.3125, 20.359375, 21.40625, 22.453125, 23.5, 24.546875, 25.59375, 26.640625, 27.6875, 28.734375, 29.78125, 30.828125, 31.875, 32.921875, 33.96875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 8.0, 12.0, 20.0, 47.0, 61.0, 150.0, 198.0, 346.0, 641.0, 1042.0, 1665.0, 2894.0, 4665.0, 7971.0, 13318.0, 21293.0, 33976.0, 53548.0, 79893.0, 118400.0, 164815.0, 217136.0, 269822.0, 414418.0, 2275983.0, 1380301.0, 329739.0, 253589.0, 199613.0, 149268.0, 104917.0, 70572.0, 46087.0, 29114.0, 17907.0, 11106.0, 6684.0, 4093.0, 2445.0, 1466.0, 908.0, 491.0, 344.0, 198.0, 120.0, 55.0, 44.0, 16.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.5625, -2.47662353515625, -2.3907470703125, -2.30487060546875, -2.218994140625, -2.13311767578125, -2.0472412109375, -1.96136474609375, -1.87548828125, -1.78961181640625, -1.7037353515625, -1.61785888671875, -1.531982421875, -1.44610595703125, -1.3602294921875, -1.27435302734375, -1.1884765625, -1.10260009765625, -1.0167236328125, -0.93084716796875, -0.844970703125, -0.75909423828125, -0.6732177734375, -0.58734130859375, -0.50146484375, -0.41558837890625, -0.3297119140625, -0.24383544921875, -0.157958984375, -0.07208251953125, 0.0137939453125, 0.09967041015625, 0.185546875, 0.27142333984375, 0.3572998046875, 0.44317626953125, 0.529052734375, 0.61492919921875, 0.7008056640625, 0.78668212890625, 0.87255859375, 0.95843505859375, 1.0443115234375, 1.13018798828125, 1.216064453125, 1.30194091796875, 1.3878173828125, 1.47369384765625, 1.5595703125, 1.64544677734375, 1.7313232421875, 1.81719970703125, 1.903076171875, 1.98895263671875, 2.0748291015625, 2.16070556640625, 2.24658203125, 2.33245849609375, 2.4183349609375, 2.50421142578125, 2.590087890625, 2.67596435546875, 2.7618408203125, 2.84771728515625, 2.93359375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 10.0, 11.0, 13.0, 11.0, 13.0, 11.0, 21.0, 23.0, 13.0, 15.0, 24.0, 16.0, 26.0, 22.0, 31.0, 37.0, 32.0, 35.0, 41.0, 53.0, 285.0, 661.0, 162.0, 44.0, 27.0, 34.0, 33.0, 35.0, 32.0, 35.0, 23.0, 23.0, 33.0, 22.0, 15.0, 22.0, 19.0, 10.0, 9.0, 9.0, 6.0, 8.0, 5.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-21.265625, -20.589599609375, -19.91357421875, -19.237548828125, -18.5615234375, -17.885498046875, -17.20947265625, -16.533447265625, -15.857421875, -15.181396484375, -14.50537109375, -13.829345703125, -13.1533203125, -12.477294921875, -11.80126953125, -11.125244140625, -10.44921875, -9.773193359375, -9.09716796875, -8.421142578125, -7.7451171875, -7.069091796875, -6.39306640625, -5.717041015625, -5.041015625, -4.364990234375, -3.68896484375, -3.012939453125, -2.3369140625, -1.660888671875, -0.98486328125, -0.308837890625, 0.3671875, 1.043212890625, 1.71923828125, 2.395263671875, 3.0712890625, 3.747314453125, 4.42333984375, 5.099365234375, 5.775390625, 6.451416015625, 7.12744140625, 7.803466796875, 8.4794921875, 9.155517578125, 9.83154296875, 10.507568359375, 11.18359375, 11.859619140625, 12.53564453125, 13.211669921875, 13.8876953125, 14.563720703125, 15.23974609375, 15.915771484375, 16.591796875, 17.267822265625, 17.94384765625, 18.619873046875, 19.2958984375, 19.971923828125, 20.64794921875, 21.323974609375, 22.0]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 14.0, 26.0, 33.0, 46.0, 67.0, 91.0, 129.0, 211.0, 335.0, 474.0, 749.0, 1274.0, 2379.0, 4708.0, 10972.0, 31234.0, 92321.0, 264714.0, 625188.0, 3997940.0, 751723.0, 325497.0, 116300.0, 39337.0, 13829.0, 5552.0, 2623.0, 1396.0, 774.0, 490.0, 324.0, 200.0, 140.0, 84.0, 56.0, 60.0, 32.0, 32.0, 22.0, 22.0, 8.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.122314453125, -6.89697265625, -6.671630859375, -6.4462890625, -6.220947265625, -5.99560546875, -5.770263671875, -5.544921875, -5.319580078125, -5.09423828125, -4.868896484375, -4.6435546875, -4.418212890625, -4.19287109375, -3.967529296875, -3.7421875, -3.516845703125, -3.29150390625, -3.066162109375, -2.8408203125, -2.615478515625, -2.39013671875, -2.164794921875, -1.939453125, -1.714111328125, -1.48876953125, -1.263427734375, -1.0380859375, -0.812744140625, -0.58740234375, -0.362060546875, -0.13671875, 0.088623046875, 0.31396484375, 0.539306640625, 0.7646484375, 0.989990234375, 1.21533203125, 1.440673828125, 1.666015625, 1.891357421875, 2.11669921875, 2.342041015625, 2.5673828125, 2.792724609375, 3.01806640625, 3.243408203125, 3.46875, 3.694091796875, 3.91943359375, 4.144775390625, 4.3701171875, 4.595458984375, 4.82080078125, 5.046142578125, 5.271484375, 5.496826171875, 5.72216796875, 5.947509765625, 6.1728515625, 6.398193359375, 6.62353515625, 6.848876953125, 7.07421875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 15.0, 12.0, 17.0, 12.0, 15.0, 24.0, 23.0, 38.0, 30.0, 43.0, 44.0, 38.0, 38.0, 43.0, 89.0, 603.0, 459.0, 64.0, 40.0, 43.0, 39.0, 40.0, 31.0, 31.0, 30.0, 32.0, 27.0, 19.0, 16.0, 10.0, 3.0, 11.0, 7.0, 8.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.500732421875, -22.68896484375, -21.877197265625, -21.0654296875, -20.253662109375, -19.44189453125, -18.630126953125, -17.818359375, -17.006591796875, -16.19482421875, -15.383056640625, -14.5712890625, -13.759521484375, -12.94775390625, -12.135986328125, -11.32421875, -10.512451171875, -9.70068359375, -8.888916015625, -8.0771484375, -7.265380859375, -6.45361328125, -5.641845703125, -4.830078125, -4.018310546875, -3.20654296875, -2.394775390625, -1.5830078125, -0.771240234375, 0.04052734375, 0.852294921875, 1.6640625, 2.475830078125, 3.28759765625, 4.099365234375, 4.9111328125, 5.722900390625, 6.53466796875, 7.346435546875, 8.158203125, 8.969970703125, 9.78173828125, 10.593505859375, 11.4052734375, 12.217041015625, 13.02880859375, 13.840576171875, 14.65234375, 15.464111328125, 16.27587890625, 17.087646484375, 17.8994140625, 18.711181640625, 19.52294921875, 20.334716796875, 21.146484375, 21.958251953125, 22.77001953125, 23.581787109375, 24.3935546875, 25.205322265625, 26.01708984375, 26.828857421875, 27.640625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 20.0, 53.0, 229.0, 444.0, 188.0, 39.0, 19.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37144470214844, -80.42475891113281, -74.47806549072266, -68.53137969970703, -62.58469009399414, -56.63800048828125, -50.691314697265625, -44.744625091552734, -38.797935485839844, -32.85124588012695, -26.904558181762695, -20.957870483398438, -15.011180877685547, -9.064491271972656, -3.1178054809570312, 2.8288841247558594, 8.77557373046875, 14.722262382507324, 20.6689510345459, 26.615638732910156, 32.56232833862305, 38.50901794433594, 44.45570373535156, 50.40239334106445, 56.349082946777344, 62.295772552490234, 68.24246215820312, 74.18914794921875, 80.13583374023438, 86.08252716064453, 92.02921295166016, 97.97590637207031, 103.92257690429688, 109.8692626953125, 115.81595611572266, 121.76264190673828, 127.70933532714844, 133.65602111816406, 139.6027069091797, 145.5493927001953, 151.49609375, 157.44277954101562, 163.38946533203125, 169.33615112304688, 175.28285217285156, 181.2295379638672, 187.1762237548828, 193.12290954589844, 199.06959533691406, 205.0162811279297, 210.9629669189453, 216.90966796875, 222.85635375976562, 228.80303955078125, 234.74972534179688, 240.6964111328125, 246.64309692382812, 252.58978271484375, 258.5364685058594, 264.483154296875, 270.4298400878906, 276.37652587890625, 282.3232421875, 288.2699279785156, 294.21661376953125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 5.0, 6.0, 2.0, 2.0, 9.0, 18.0, 14.0, 16.0, 19.0, 29.0, 38.0, 23.0, 42.0, 52.0, 39.0, 46.0, 61.0, 46.0, 42.0, 49.0, 47.0, 60.0, 47.0, 49.0, 31.0, 36.0, 38.0, 26.0, 16.0, 20.0, 14.0, 10.0, 11.0, 14.0, 11.0, 1.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.63560485839844, -55.57374572753906, -53.51188278198242, -51.45002365112305, -49.388160705566406, -47.32630157470703, -45.264442443847656, -43.202579498291016, -41.140716552734375, -39.078857421875, -37.01699447631836, -34.955135345458984, -32.893272399902344, -30.83141326904297, -28.76955223083496, -26.707691192626953, -24.645832061767578, -22.58397102355957, -20.522109985351562, -18.460250854492188, -16.398387908935547, -14.336527824401855, -12.274667739868164, -10.212806701660156, -8.150945663452148, -6.089084625244141, -4.027224063873291, -1.9653635025024414, 0.0964975357055664, 2.158358573913574, 4.220218658447266, 6.282079696655273, 8.343940734863281, 10.405801773071289, 12.467662811279297, 14.529522895812988, 16.591384887695312, 18.653244018554688, 20.715105056762695, 22.776966094970703, 24.83882713317871, 26.90068817138672, 28.962549209594727, 31.024410247802734, 33.08626937866211, 35.14813232421875, 37.209991455078125, 39.2718505859375, 41.33371353149414, 43.395572662353516, 45.457435607910156, 47.51929473876953, 49.58115768432617, 51.64301681518555, 53.70487976074219, 55.76673889160156, 57.82859802246094, 59.89045715332031, 61.95232009887695, 64.0141830444336, 66.07604217529297, 68.13790130615234, 70.19976043701172, 72.26162719726562, 74.323486328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 10.0, 5.0, 8.0, 11.0, 14.0, 8.0, 12.0, 16.0, 29.0, 42.0, 72.0, 109.0, 230.0, 324.0, 675.0, 1278.0, 2893.0, 7063.0, 22535.0, 183054.0, 2766829.0, 1122707.0, 62930.0, 14170.0, 5101.0, 2049.0, 984.0, 435.0, 228.0, 147.0, 90.0, 46.0, 48.0, 32.0, 29.0, 14.0, 17.0, 5.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.2978515625, -1.258270263671875, -1.21868896484375, -1.179107666015625, -1.1395263671875, -1.099945068359375, -1.06036376953125, -1.020782470703125, -0.981201171875, -0.941619873046875, -0.90203857421875, -0.862457275390625, -0.8228759765625, -0.783294677734375, -0.74371337890625, -0.704132080078125, -0.66455078125, -0.624969482421875, -0.58538818359375, -0.545806884765625, -0.5062255859375, -0.466644287109375, -0.42706298828125, -0.387481689453125, -0.347900390625, -0.308319091796875, -0.26873779296875, -0.229156494140625, -0.1895751953125, -0.149993896484375, -0.11041259765625, -0.070831298828125, -0.03125, 0.008331298828125, 0.04791259765625, 0.087493896484375, 0.1270751953125, 0.166656494140625, 0.20623779296875, 0.245819091796875, 0.285400390625, 0.324981689453125, 0.36456298828125, 0.404144287109375, 0.4437255859375, 0.483306884765625, 0.52288818359375, 0.562469482421875, 0.60205078125, 0.641632080078125, 0.68121337890625, 0.720794677734375, 0.7603759765625, 0.799957275390625, 0.83953857421875, 0.879119873046875, 0.918701171875, 0.958282470703125, 0.99786376953125, 1.037445068359375, 1.0770263671875, 1.116607666015625, 1.15618896484375, 1.195770263671875, 1.2353515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 6.0, 6.0, 3.0, 17.0, 11.0, 17.0, 18.0, 26.0, 43.0, 21.0, 42.0, 55.0, 54.0, 62.0, 56.0, 72.0, 62.0, 73.0, 63.0, 45.0, 50.0, 26.0, 31.0, 30.0, 18.0, 19.0, 16.0, 14.0, 15.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5324020385742188, -0.5145111083984375, -0.49662017822265625, -0.478729248046875, -0.46083831787109375, -0.4429473876953125, -0.42505645751953125, -0.40716552734375, -0.38927459716796875, -0.3713836669921875, -0.35349273681640625, -0.335601806640625, -0.31771087646484375, -0.2998199462890625, -0.28192901611328125, -0.2640380859375, -0.24614715576171875, -0.2282562255859375, -0.21036529541015625, -0.192474365234375, -0.17458343505859375, -0.1566925048828125, -0.13880157470703125, -0.12091064453125, -0.10301971435546875, -0.0851287841796875, -0.06723785400390625, -0.049346923828125, -0.03145599365234375, -0.0135650634765625, 0.00432586669921875, 0.022216796875, 0.04010772705078125, 0.0579986572265625, 0.07588958740234375, 0.093780517578125, 0.11167144775390625, 0.1295623779296875, 0.14745330810546875, 0.16534423828125, 0.18323516845703125, 0.2011260986328125, 0.21901702880859375, 0.236907958984375, 0.25479888916015625, 0.2726898193359375, 0.29058074951171875, 0.3084716796875, 0.32636260986328125, 0.3442535400390625, 0.36214447021484375, 0.380035400390625, 0.39792633056640625, 0.4158172607421875, 0.43370819091796875, 0.45159912109375, 0.46949005126953125, 0.4873809814453125, 0.5052719116210938, 0.523162841796875, 0.5410537719726562, 0.5589447021484375, 0.5768356323242188, 0.5947265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 9.0, 13.0, 25.0, 36.0, 46.0, 92.0, 159.0, 379.0, 1145.0, 7766.0, 244910.0, 3870322.0, 64126.0, 3912.0, 797.0, 269.0, 115.0, 49.0, 35.0, 13.0, 14.0, 5.0, 13.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.259765625, -2.2008514404296875, -2.141937255859375, -2.0830230712890625, -2.02410888671875, -1.9651947021484375, -1.906280517578125, -1.8473663330078125, -1.7884521484375, -1.7295379638671875, -1.670623779296875, -1.6117095947265625, -1.55279541015625, -1.4938812255859375, -1.434967041015625, -1.3760528564453125, -1.317138671875, -1.2582244873046875, -1.199310302734375, -1.1403961181640625, -1.08148193359375, -1.0225677490234375, -0.963653564453125, -0.9047393798828125, -0.8458251953125, -0.7869110107421875, -0.727996826171875, -0.6690826416015625, -0.61016845703125, -0.5512542724609375, -0.492340087890625, -0.4334259033203125, -0.37451171875, -0.3155975341796875, -0.256683349609375, -0.1977691650390625, -0.13885498046875, -0.0799407958984375, -0.021026611328125, 0.0378875732421875, 0.0968017578125, 0.1557159423828125, 0.214630126953125, 0.2735443115234375, 0.33245849609375, 0.3913726806640625, 0.450286865234375, 0.5092010498046875, 0.568115234375, 0.6270294189453125, 0.685943603515625, 0.7448577880859375, 0.80377197265625, 0.8626861572265625, 0.921600341796875, 0.9805145263671875, 1.0394287109375, 1.0983428955078125, 1.157257080078125, 1.2161712646484375, 1.27508544921875, 1.3339996337890625, 1.392913818359375, 1.4518280029296875, 1.5107421875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 10.0, 28.0, 28.0, 63.0, 140.0, 218.0, 502.0, 909.0, 933.0, 592.0, 285.0, 152.0, 80.0, 54.0, 18.0, 20.0, 10.0, 10.0, 8.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0263671875, -0.997039794921875, -0.96771240234375, -0.938385009765625, -0.9090576171875, -0.879730224609375, -0.85040283203125, -0.821075439453125, -0.791748046875, -0.762420654296875, -0.73309326171875, -0.703765869140625, -0.6744384765625, -0.645111083984375, -0.61578369140625, -0.586456298828125, -0.55712890625, -0.527801513671875, -0.49847412109375, -0.469146728515625, -0.4398193359375, -0.410491943359375, -0.38116455078125, -0.351837158203125, -0.322509765625, -0.293182373046875, -0.26385498046875, -0.234527587890625, -0.2052001953125, -0.175872802734375, -0.14654541015625, -0.117218017578125, -0.087890625, -0.058563232421875, -0.02923583984375, 9.1552734375e-05, 0.0294189453125, 0.058746337890625, 0.08807373046875, 0.117401123046875, 0.146728515625, 0.176055908203125, 0.20538330078125, 0.234710693359375, 0.2640380859375, 0.293365478515625, 0.32269287109375, 0.352020263671875, 0.38134765625, 0.410675048828125, 0.44000244140625, 0.469329833984375, 0.4986572265625, 0.527984619140625, 0.55731201171875, 0.586639404296875, 0.615966796875, 0.645294189453125, 0.67462158203125, 0.703948974609375, 0.7332763671875, 0.762603759765625, 0.79193115234375, 0.821258544921875, 0.8505859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 12.0, 82.0, 841.0, 80.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.266066312789917, -2.5464601516723633, -1.8268537521362305, -1.1072475910186768, -0.38764119148254395, 0.33196520805358887, 1.0515711307525635, 1.7711775302886963, 2.490783929824829, 3.210390090942383, 3.9299964904785156, 4.649602890014648, 5.369209289550781, 6.088815689086914, 6.8084211349487305, 7.528027534484863, 8.247633934020996, 8.967240333557129, 9.686846733093262, 10.406452178955078, 11.126058578491211, 11.845664978027344, 12.565271377563477, 13.28487777709961, 14.004484176635742, 14.724090576171875, 15.443696975708008, 16.16330337524414, 16.882909774780273, 17.602516174316406, 18.322120666503906, 19.041728973388672, 19.761333465576172, 20.480939865112305, 21.200546264648438, 21.92015266418457, 22.639759063720703, 23.359365463256836, 24.07897186279297, 24.79857635498047, 25.518184661865234, 26.237791061401367, 26.9573974609375, 27.677003860473633, 28.396610260009766, 29.1162166595459, 29.83582305908203, 30.55542755126953, 31.275033950805664, 31.994640350341797, 32.7142448425293, 33.43385314941406, 34.15345764160156, 34.87306594848633, 35.59267044067383, 36.312278747558594, 37.031883239746094, 37.751487731933594, 38.47109603881836, 39.19070053100586, 39.910308837890625, 40.629913330078125, 41.34952163696289, 42.06912612915039, 42.788734436035156]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 7.0, 4.0, 15.0, 16.0, 12.0, 27.0, 24.0, 26.0, 18.0, 21.0, 44.0, 43.0, 45.0, 55.0, 49.0, 51.0, 45.0, 66.0, 45.0, 47.0, 50.0, 37.0, 43.0, 32.0, 27.0, 28.0, 25.0, 24.0, 14.0, 10.0, 10.0, 10.0, 4.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3538265228271484, -2.278740406036377, -2.2036545276641846, -2.128568649291992, -2.0534825325012207, -1.9783965349197388, -1.9033105373382568, -1.828224539756775, -1.753138542175293, -1.678052544593811, -1.602966547012329, -1.5278805494308472, -1.4527945518493652, -1.3777085542678833, -1.3026225566864014, -1.2275365591049194, -1.1524505615234375, -1.0773645639419556, -1.0022785663604736, -0.9271925687789917, -0.8521065711975098, -0.7770205736160278, -0.7019345760345459, -0.626848578453064, -0.551762580871582, -0.4766765832901001, -0.40159058570861816, -0.32650458812713623, -0.2514185905456543, -0.17633259296417236, -0.10124659538269043, -0.026160597801208496, 0.04892563819885254, 0.12401163578033447, 0.1990976333618164, 0.27418363094329834, 0.3492696285247803, 0.4243556261062622, 0.49944162368774414, 0.5745276212692261, 0.649613618850708, 0.7246996164321899, 0.7997856140136719, 0.8748716115951538, 0.9499576091766357, 1.0250436067581177, 1.1001296043395996, 1.1752156019210815, 1.2503015995025635, 1.3253875970840454, 1.4004735946655273, 1.4755595922470093, 1.5506455898284912, 1.6257315874099731, 1.700817584991455, 1.775903582572937, 1.850989580154419, 1.9260755777359009, 2.001161575317383, 2.0762476921081543, 2.1513335704803467, 2.226419448852539, 2.3015055656433105, 2.376591682434082, 2.4516775608062744]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 13.0, 11.0, 21.0, 16.0, 30.0, 62.0, 82.0, 100.0, 135.0, 206.0, 292.0, 441.0, 709.0, 1094.0, 2171.0, 4099.0, 9931.0, 41239.0, 441964.0, 481303.0, 44344.0, 10372.0, 4281.0, 2227.0, 1250.0, 765.0, 449.0, 318.0, 182.0, 124.0, 78.0, 65.0, 38.0, 35.0, 27.0, 15.0, 15.0, 10.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.5009765625, -1.4555206298828125, -1.410064697265625, -1.3646087646484375, -1.31915283203125, -1.2736968994140625, -1.228240966796875, -1.1827850341796875, -1.1373291015625, -1.0918731689453125, -1.046417236328125, -1.0009613037109375, -0.95550537109375, -0.9100494384765625, -0.864593505859375, -0.8191375732421875, -0.773681640625, -0.7282257080078125, -0.682769775390625, -0.6373138427734375, -0.59185791015625, -0.5464019775390625, -0.500946044921875, -0.4554901123046875, -0.4100341796875, -0.3645782470703125, -0.319122314453125, -0.2736663818359375, -0.22821044921875, -0.1827545166015625, -0.137298583984375, -0.0918426513671875, -0.04638671875, -0.0009307861328125, 0.044525146484375, 0.0899810791015625, 0.13543701171875, 0.1808929443359375, 0.226348876953125, 0.2718048095703125, 0.3172607421875, 0.3627166748046875, 0.408172607421875, 0.4536285400390625, 0.49908447265625, 0.5445404052734375, 0.589996337890625, 0.6354522705078125, 0.680908203125, 0.7263641357421875, 0.771820068359375, 0.8172760009765625, 0.86273193359375, 0.9081878662109375, 0.953643798828125, 0.9990997314453125, 1.0445556640625, 1.0900115966796875, 1.135467529296875, 1.1809234619140625, 1.22637939453125, 1.2718353271484375, 1.317291259765625, 1.3627471923828125, 1.408203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 15.0, 9.0, 12.0, 9.0, 23.0, 26.0, 33.0, 24.0, 42.0, 51.0, 70.0, 69.0, 65.0, 54.0, 65.0, 67.0, 64.0, 49.0, 45.0, 34.0, 27.0, 31.0, 26.0, 19.0, 17.0, 13.0, 10.0, 5.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.59027099609375, -0.5716552734375, -0.55303955078125, -0.534423828125, -0.51580810546875, -0.4971923828125, -0.47857666015625, -0.4599609375, -0.44134521484375, -0.4227294921875, -0.40411376953125, -0.385498046875, -0.36688232421875, -0.3482666015625, -0.32965087890625, -0.31103515625, -0.29241943359375, -0.2738037109375, -0.25518798828125, -0.236572265625, -0.21795654296875, -0.1993408203125, -0.18072509765625, -0.162109375, -0.14349365234375, -0.1248779296875, -0.10626220703125, -0.087646484375, -0.06903076171875, -0.0504150390625, -0.03179931640625, -0.01318359375, 0.00543212890625, 0.0240478515625, 0.04266357421875, 0.061279296875, 0.07989501953125, 0.0985107421875, 0.11712646484375, 0.1357421875, 0.15435791015625, 0.1729736328125, 0.19158935546875, 0.210205078125, 0.22882080078125, 0.2474365234375, 0.26605224609375, 0.28466796875, 0.30328369140625, 0.3218994140625, 0.34051513671875, 0.359130859375, 0.37774658203125, 0.3963623046875, 0.41497802734375, 0.43359375, 0.45220947265625, 0.4708251953125, 0.48944091796875, 0.508056640625, 0.52667236328125, 0.5452880859375, 0.56390380859375, 0.58251953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 4.0, 12.0, 10.0, 8.0, 8.0, 11.0, 16.0, 16.0, 21.0, 23.0, 36.0, 30.0, 39.0, 62.0, 93.0, 254.0, 991.0, 7010.0, 63030.0, 408635.0, 472696.0, 84194.0, 9393.0, 1223.0, 286.0, 101.0, 70.0, 42.0, 30.0, 26.0, 24.0, 30.0, 18.0, 22.0, 10.0, 8.0, 9.0, 9.0, 2.0, 12.0, 6.0, 3.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0263671875, -0.9962387084960938, -0.9661102294921875, -0.9359817504882812, -0.905853271484375, -0.8757247924804688, -0.8455963134765625, -0.8154678344726562, -0.78533935546875, -0.7552108764648438, -0.7250823974609375, -0.6949539184570312, -0.664825439453125, -0.6346969604492188, -0.6045684814453125, -0.5744400024414062, -0.5443115234375, -0.5141830444335938, -0.4840545654296875, -0.45392608642578125, -0.423797607421875, -0.39366912841796875, -0.3635406494140625, -0.33341217041015625, -0.30328369140625, -0.27315521240234375, -0.2430267333984375, -0.21289825439453125, -0.182769775390625, -0.15264129638671875, -0.1225128173828125, -0.09238433837890625, -0.062255859375, -0.03212738037109375, -0.0019989013671875, 0.02812957763671875, 0.058258056640625, 0.08838653564453125, 0.1185150146484375, 0.14864349365234375, 0.17877197265625, 0.20890045166015625, 0.2390289306640625, 0.26915740966796875, 0.299285888671875, 0.32941436767578125, 0.3595428466796875, 0.38967132568359375, 0.4197998046875, 0.44992828369140625, 0.4800567626953125, 0.5101852416992188, 0.540313720703125, 0.5704421997070312, 0.6005706787109375, 0.6306991577148438, 0.66082763671875, 0.6909561157226562, 0.7210845947265625, 0.7512130737304688, 0.781341552734375, 0.8114700317382812, 0.8415985107421875, 0.8717269897460938, 0.90185546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 3.0, 6.0, 14.0, 14.0, 17.0, 22.0, 13.0, 18.0, 25.0, 16.0, 25.0, 25.0, 18.0, 34.0, 36.0, 35.0, 29.0, 29.0, 43.0, 35.0, 35.0, 28.0, 31.0, 33.0, 37.0, 34.0, 32.0, 31.0, 27.0, 27.0, 40.0, 28.0, 17.0, 16.0, 16.0, 18.0, 7.0, 13.0, 13.0, 14.0, 5.0, 10.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.9501953125, -0.9215240478515625, -0.892852783203125, -0.8641815185546875, -0.83551025390625, -0.8068389892578125, -0.778167724609375, -0.7494964599609375, -0.7208251953125, -0.6921539306640625, -0.663482666015625, -0.6348114013671875, -0.60614013671875, -0.5774688720703125, -0.548797607421875, -0.5201263427734375, -0.491455078125, -0.4627838134765625, -0.434112548828125, -0.4054412841796875, -0.37677001953125, -0.3480987548828125, -0.319427490234375, -0.2907562255859375, -0.2620849609375, -0.2334136962890625, -0.204742431640625, -0.1760711669921875, -0.14739990234375, -0.1187286376953125, -0.090057373046875, -0.0613861083984375, -0.03271484375, -0.0040435791015625, 0.024627685546875, 0.0532989501953125, 0.08197021484375, 0.1106414794921875, 0.139312744140625, 0.1679840087890625, 0.1966552734375, 0.2253265380859375, 0.253997802734375, 0.2826690673828125, 0.31134033203125, 0.3400115966796875, 0.368682861328125, 0.3973541259765625, 0.426025390625, 0.4546966552734375, 0.483367919921875, 0.5120391845703125, 0.54071044921875, 0.5693817138671875, 0.598052978515625, 0.6267242431640625, 0.6553955078125, 0.6840667724609375, 0.712738037109375, 0.7414093017578125, 0.77008056640625, 0.7987518310546875, 0.827423095703125, 0.8560943603515625, 0.884765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 22.0, 22.0, 30.0, 39.0, 59.0, 92.0, 162.0, 272.0, 514.0, 982.0, 2161.0, 5677.0, 19603.0, 90168.0, 380780.0, 411639.0, 103047.0, 22505.0, 6197.0, 2243.0, 1019.0, 510.0, 282.0, 172.0, 110.0, 62.0, 47.0, 29.0, 24.0, 18.0, 4.0, 14.0, 9.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.25439453125, -0.24692153930664062, -0.23944854736328125, -0.23197555541992188, -0.2245025634765625, -0.21702957153320312, -0.20955657958984375, -0.20208358764648438, -0.194610595703125, -0.18713760375976562, -0.17966461181640625, -0.17219161987304688, -0.1647186279296875, -0.15724563598632812, -0.14977264404296875, -0.14229965209960938, -0.13482666015625, -0.12735366821289062, -0.11988067626953125, -0.11240768432617188, -0.1049346923828125, -0.09746170043945312, -0.08998870849609375, -0.08251571655273438, -0.075042724609375, -0.06756973266601562, -0.06009674072265625, -0.052623748779296875, -0.0451507568359375, -0.037677764892578125, -0.03020477294921875, -0.022731781005859375, -0.0152587890625, -0.007785797119140625, -0.00031280517578125, 0.007160186767578125, 0.0146331787109375, 0.022106170654296875, 0.02957916259765625, 0.037052154541015625, 0.044525146484375, 0.051998138427734375, 0.05947113037109375, 0.06694412231445312, 0.0744171142578125, 0.08189010620117188, 0.08936309814453125, 0.09683609008789062, 0.10430908203125, 0.11178207397460938, 0.11925506591796875, 0.12672805786132812, 0.1342010498046875, 0.14167404174804688, 0.14914703369140625, 0.15662002563476562, 0.164093017578125, 0.17156600952148438, 0.17903900146484375, 0.18651199340820312, 0.1939849853515625, 0.20145797729492188, 0.20893096923828125, 0.21640396118164062, 0.223876953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 11.0, 5.0, 22.0, 20.0, 38.0, 45.0, 52.0, 58.0, 87.0, 90.0, 95.0, 91.0, 73.0, 68.0, 53.0, 44.0, 28.0, 26.0, 21.0, 12.0, 10.0, 7.0, 2.0, 3.0, 6.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.008676528930664e-05, -1.941155642271042e-05, -1.8736347556114197e-05, -1.8061138689517975e-05, -1.7385929822921753e-05, -1.671072095632553e-05, -1.603551208972931e-05, -1.5360303223133087e-05, -1.4685094356536865e-05, -1.4009885489940643e-05, -1.3334676623344421e-05, -1.26594677567482e-05, -1.1984258890151978e-05, -1.1309050023555756e-05, -1.0633841156959534e-05, -9.958632290363312e-06, -9.28342342376709e-06, -8.608214557170868e-06, -7.933005690574646e-06, -7.257796823978424e-06, -6.582587957382202e-06, -5.90737909078598e-06, -5.232170224189758e-06, -4.556961357593536e-06, -3.8817524909973145e-06, -3.2065436244010925e-06, -2.5313347578048706e-06, -1.8561258912086487e-06, -1.1809170246124268e-06, -5.057081580162048e-07, 1.695007085800171e-07, 8.44709575176239e-07, 1.519918441772461e-06, 2.195127308368683e-06, 2.8703361749649048e-06, 3.5455450415611267e-06, 4.220753908157349e-06, 4.8959627747535706e-06, 5.5711716413497925e-06, 6.246380507946014e-06, 6.921589374542236e-06, 7.596798241138458e-06, 8.27200710773468e-06, 8.947215974330902e-06, 9.622424840927124e-06, 1.0297633707523346e-05, 1.0972842574119568e-05, 1.164805144071579e-05, 1.2323260307312012e-05, 1.2998469173908234e-05, 1.3673678040504456e-05, 1.4348886907100677e-05, 1.50240957736969e-05, 1.569930464029312e-05, 1.6374513506889343e-05, 1.7049722373485565e-05, 1.7724931240081787e-05, 1.840014010667801e-05, 1.907534897327423e-05, 1.9750557839870453e-05, 2.0425766706466675e-05, 2.1100975573062897e-05, 2.177618443965912e-05, 2.245139330625534e-05, 2.3126602172851562e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 6.0, 10.0, 14.0, 46.0, 110.0, 288.0, 675.0, 2221.0, 8798.0, 51933.0, 431966.0, 479041.0, 59942.0, 9861.0, 2446.0, 729.0, 251.0, 110.0, 47.0, 17.0, 18.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.23958587646484375, -0.2281951904296875, -0.21680450439453125, -0.205413818359375, -0.19402313232421875, -0.1826324462890625, -0.17124176025390625, -0.15985107421875, -0.14846038818359375, -0.1370697021484375, -0.12567901611328125, -0.114288330078125, -0.10289764404296875, -0.0915069580078125, -0.08011627197265625, -0.0687255859375, -0.05733489990234375, -0.0459442138671875, -0.03455352783203125, -0.023162841796875, -0.01177215576171875, -0.0003814697265625, 0.01100921630859375, 0.02239990234375, 0.03379058837890625, 0.0451812744140625, 0.05657196044921875, 0.067962646484375, 0.07935333251953125, 0.0907440185546875, 0.10213470458984375, 0.113525390625, 0.12491607666015625, 0.1363067626953125, 0.14769744873046875, 0.159088134765625, 0.17047882080078125, 0.1818695068359375, 0.19326019287109375, 0.20465087890625, 0.21604156494140625, 0.2274322509765625, 0.23882293701171875, 0.250213623046875, 0.26160430908203125, 0.2729949951171875, 0.28438568115234375, 0.2957763671875, 0.30716705322265625, 0.3185577392578125, 0.32994842529296875, 0.341339111328125, 0.35272979736328125, 0.3641204833984375, 0.37551116943359375, 0.38690185546875, 0.39829254150390625, 0.4096832275390625, 0.42107391357421875, 0.432464599609375, 0.44385528564453125, 0.4552459716796875, 0.46663665771484375, 0.47802734375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 6.0, 7.0, 10.0, 13.0, 10.0, 22.0, 31.0, 40.0, 64.0, 46.0, 76.0, 79.0, 72.0, 74.0, 74.0, 74.0, 61.0, 43.0, 49.0, 38.0, 28.0, 22.0, 14.0, 15.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2293701171875, -0.2222137451171875, -0.215057373046875, -0.2079010009765625, -0.20074462890625, -0.1935882568359375, -0.186431884765625, -0.1792755126953125, -0.172119140625, -0.1649627685546875, -0.157806396484375, -0.1506500244140625, -0.14349365234375, -0.1363372802734375, -0.129180908203125, -0.1220245361328125, -0.1148681640625, -0.1077117919921875, -0.100555419921875, -0.0933990478515625, -0.08624267578125, -0.0790863037109375, -0.071929931640625, -0.0647735595703125, -0.0576171875, -0.0504608154296875, -0.043304443359375, -0.0361480712890625, -0.02899169921875, -0.0218353271484375, -0.014678955078125, -0.0075225830078125, -0.0003662109375, 0.0067901611328125, 0.013946533203125, 0.0211029052734375, 0.02825927734375, 0.0354156494140625, 0.042572021484375, 0.0497283935546875, 0.056884765625, 0.0640411376953125, 0.071197509765625, 0.0783538818359375, 0.08551025390625, 0.0926666259765625, 0.099822998046875, 0.1069793701171875, 0.1141357421875, 0.1212921142578125, 0.128448486328125, 0.1356048583984375, 0.14276123046875, 0.1499176025390625, 0.157073974609375, 0.1642303466796875, 0.17138671875, 0.1785430908203125, 0.185699462890625, 0.1928558349609375, 0.20001220703125, 0.2071685791015625, 0.214324951171875, 0.2214813232421875, 0.2286376953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 19.0, 58.0, 212.0, 333.0, 251.0, 92.0, 33.0, 12.0, 2.0, 2.0, 0.0, 1.0], "bins": [-17.187150955200195, -16.878541946411133, -16.56993293762207, -16.261323928833008, -15.952713966369629, -15.644104957580566, -15.335495948791504, -15.026885986328125, -14.718276977539062, -14.40966796875, -14.101058959960938, -13.792448997497559, -13.483839988708496, -13.175230979919434, -12.866621971130371, -12.558012008666992, -12.24940299987793, -11.940793991088867, -11.632184982299805, -11.323575019836426, -11.014966011047363, -10.7063570022583, -10.397747993469238, -10.08913803100586, -9.780529975891113, -9.47192096710205, -9.163311958312988, -8.85470199584961, -8.546092987060547, -8.237483978271484, -7.928874969482422, -7.620265483856201, -7.311656475067139, -7.003047466278076, -6.6944379806518555, -6.385828971862793, -6.077219486236572, -5.76861047744751, -5.460000991821289, -5.151391983032227, -4.842782974243164, -4.534173965454102, -4.225564479827881, -3.9169554710388184, -3.6083459854125977, -3.299736976623535, -2.9911277294158936, -2.682518482208252, -2.3739089965820312, -2.0652997493743896, -1.756690502166748, -1.448081374168396, -1.1394721269607544, -0.8308628797531128, -0.5222537517547607, -0.21364450454711914, 0.09496474266052246, 0.4035739600658417, 0.7121831774711609, 1.0207923650741577, 1.3294016122817993, 1.638010859489441, 1.946619987487793, 2.2552292346954346, 2.563838481903076]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 8.0, 9.0, 8.0, 14.0, 12.0, 16.0, 18.0, 25.0, 24.0, 24.0, 33.0, 30.0, 46.0, 48.0, 57.0, 40.0, 60.0, 43.0, 49.0, 43.0, 50.0, 44.0, 39.0, 33.0, 41.0, 30.0, 22.0, 26.0, 11.0, 15.0, 12.0, 13.0, 14.0, 7.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.65399169921875, -5.475531101226807, -5.297070503234863, -5.11860990524292, -4.940149307250977, -4.761688232421875, -4.58322811126709, -4.404767036437988, -4.226306438446045, -4.047845840454102, -3.869385242462158, -3.690924644470215, -3.5124638080596924, -3.334003210067749, -3.1555426120758057, -2.977081775665283, -2.798621416091919, -2.6201608180999756, -2.4417002201080322, -2.2632393836975098, -2.0847787857055664, -1.906318187713623, -1.7278575897216797, -1.5493968725204468, -1.3709362745285034, -1.19247567653656, -1.0140149593353271, -0.8355543613433838, -0.6570937037467957, -0.4786330461502075, -0.30017244815826416, -0.12171173095703125, 0.05674886703491211, 0.23520950973033905, 0.413670152425766, 0.5921307802200317, 0.7705914378166199, 0.949052095413208, 1.1275126934051514, 1.3059734106063843, 1.4844340085983276, 1.662894606590271, 1.841355323791504, 2.0198159217834473, 2.1982765197753906, 2.376737117767334, 2.5551977157592773, 2.7336585521698, 2.912119150161743, 3.0905797481536865, 3.26904034614563, 3.4475011825561523, 3.6259617805480957, 3.804422378540039, 3.9828829765319824, 4.161343574523926, 4.339804172515869, 4.5182647705078125, 4.696725368499756, 4.875185966491699, 5.053646564483643, 5.232107162475586, 5.4105682373046875, 5.589028835296631, 5.767489433288574]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 2.0, 6.0, 8.0, 15.0, 9.0, 6.0, 9.0, 20.0, 21.0, 24.0, 18.0, 33.0, 45.0, 79.0, 96.0, 254.0, 640.0, 2363.0, 20859.0, 3136652.0, 1018685.0, 11618.0, 1716.0, 505.0, 211.0, 95.0, 74.0, 39.0, 38.0, 14.0, 16.0, 16.0, 19.0, 11.0, 8.0, 15.0, 8.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.683441162109375, -2.58367919921875, -2.483917236328125, -2.3841552734375, -2.284393310546875, -2.18463134765625, -2.084869384765625, -1.985107421875, -1.885345458984375, -1.78558349609375, -1.685821533203125, -1.5860595703125, -1.486297607421875, -1.38653564453125, -1.286773681640625, -1.18701171875, -1.087249755859375, -0.98748779296875, -0.887725830078125, -0.7879638671875, -0.688201904296875, -0.58843994140625, -0.488677978515625, -0.388916015625, -0.289154052734375, -0.18939208984375, -0.089630126953125, 0.0101318359375, 0.109893798828125, 0.20965576171875, 0.309417724609375, 0.4091796875, 0.508941650390625, 0.60870361328125, 0.708465576171875, 0.8082275390625, 0.907989501953125, 1.00775146484375, 1.107513427734375, 1.207275390625, 1.307037353515625, 1.40679931640625, 1.506561279296875, 1.6063232421875, 1.706085205078125, 1.80584716796875, 1.905609130859375, 2.00537109375, 2.105133056640625, 2.20489501953125, 2.304656982421875, 2.4044189453125, 2.504180908203125, 2.60394287109375, 2.703704833984375, 2.803466796875, 2.903228759765625, 3.00299072265625, 3.102752685546875, 3.2025146484375, 3.302276611328125, 3.40203857421875, 3.501800537109375, 3.6015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 4.0, 7.0, 6.0, 14.0, 14.0, 14.0, 6.0, 16.0, 26.0, 28.0, 30.0, 33.0, 34.0, 42.0, 46.0, 44.0, 59.0, 51.0, 46.0, 63.0, 49.0, 46.0, 45.0, 38.0, 42.0, 31.0, 22.0, 16.0, 25.0, 21.0, 20.0, 15.0, 6.0, 10.0, 7.0, 8.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.470947265625, -0.45648193359375, -0.4420166015625, -0.42755126953125, -0.4130859375, -0.39862060546875, -0.3841552734375, -0.36968994140625, -0.355224609375, -0.34075927734375, -0.3262939453125, -0.31182861328125, -0.29736328125, -0.28289794921875, -0.2684326171875, -0.25396728515625, -0.239501953125, -0.22503662109375, -0.2105712890625, -0.19610595703125, -0.181640625, -0.16717529296875, -0.1527099609375, -0.13824462890625, -0.123779296875, -0.10931396484375, -0.0948486328125, -0.08038330078125, -0.06591796875, -0.05145263671875, -0.0369873046875, -0.02252197265625, -0.008056640625, 0.00640869140625, 0.0208740234375, 0.03533935546875, 0.0498046875, 0.06427001953125, 0.0787353515625, 0.09320068359375, 0.107666015625, 0.12213134765625, 0.1365966796875, 0.15106201171875, 0.16552734375, 0.17999267578125, 0.1944580078125, 0.20892333984375, 0.223388671875, 0.23785400390625, 0.2523193359375, 0.26678466796875, 0.28125, 0.29571533203125, 0.3101806640625, 0.32464599609375, 0.339111328125, 0.35357666015625, 0.3680419921875, 0.38250732421875, 0.39697265625, 0.41143798828125, 0.4259033203125, 0.44036865234375, 0.454833984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 7.0, 9.0, 11.0, 24.0, 25.0, 36.0, 63.0, 111.0, 193.0, 417.0, 775.0, 1695.0, 3861.0, 10449.0, 31700.0, 111856.0, 445305.0, 1736504.0, 1382339.0, 341587.0, 86962.0, 25806.0, 8461.0, 3305.0, 1402.0, 609.0, 312.0, 171.0, 103.0, 64.0, 34.0, 27.0, 16.0, 15.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6772384643554688, -0.6489105224609375, -0.6205825805664062, -0.592254638671875, -0.5639266967773438, -0.5355987548828125, -0.5072708129882812, -0.47894287109375, -0.45061492919921875, -0.4222869873046875, -0.39395904541015625, -0.365631103515625, -0.33730316162109375, -0.3089752197265625, -0.28064727783203125, -0.2523193359375, -0.22399139404296875, -0.1956634521484375, -0.16733551025390625, -0.139007568359375, -0.11067962646484375, -0.0823516845703125, -0.05402374267578125, -0.02569580078125, 0.00263214111328125, 0.0309600830078125, 0.05928802490234375, 0.087615966796875, 0.11594390869140625, 0.1442718505859375, 0.17259979248046875, 0.200927734375, 0.22925567626953125, 0.2575836181640625, 0.28591156005859375, 0.314239501953125, 0.34256744384765625, 0.3708953857421875, 0.39922332763671875, 0.42755126953125, 0.45587921142578125, 0.4842071533203125, 0.5125350952148438, 0.540863037109375, 0.5691909790039062, 0.5975189208984375, 0.6258468627929688, 0.6541748046875, 0.6825027465820312, 0.7108306884765625, 0.7391586303710938, 0.767486572265625, 0.7958145141601562, 0.8241424560546875, 0.8524703979492188, 0.88079833984375, 0.9091262817382812, 0.9374542236328125, 0.9657821655273438, 0.994110107421875, 1.0224380493164062, 1.0507659912109375, 1.0790939331054688, 1.107421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 7.0, 13.0, 23.0, 42.0, 33.0, 38.0, 64.0, 78.0, 98.0, 153.0, 199.0, 250.0, 320.0, 398.0, 475.0, 424.0, 338.0, 234.0, 218.0, 159.0, 117.0, 95.0, 91.0, 33.0, 42.0, 31.0, 24.0, 13.0, 16.0, 8.0, 4.0, 3.0, 6.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.3698921203613281, -0.35477447509765625, -0.3396568298339844, -0.3245391845703125, -0.3094215393066406, -0.29430389404296875, -0.2791862487792969, -0.264068603515625, -0.24895095825195312, -0.23383331298828125, -0.21871566772460938, -0.2035980224609375, -0.18848037719726562, -0.17336273193359375, -0.15824508666992188, -0.14312744140625, -0.12800979614257812, -0.11289215087890625, -0.09777450561523438, -0.0826568603515625, -0.06753921508789062, -0.05242156982421875, -0.037303924560546875, -0.022186279296875, -0.007068634033203125, 0.00804901123046875, 0.023166656494140625, 0.0382843017578125, 0.053401947021484375, 0.06851959228515625, 0.08363723754882812, 0.0987548828125, 0.11387252807617188, 0.12899017333984375, 0.14410781860351562, 0.1592254638671875, 0.17434310913085938, 0.18946075439453125, 0.20457839965820312, 0.219696044921875, 0.23481369018554688, 0.24993133544921875, 0.2650489807128906, 0.2801666259765625, 0.2952842712402344, 0.31040191650390625, 0.3255195617675781, 0.34063720703125, 0.3557548522949219, 0.37087249755859375, 0.3859901428222656, 0.4011077880859375, 0.4162254333496094, 0.43134307861328125, 0.4464607238769531, 0.461578369140625, 0.4766960144042969, 0.49181365966796875, 0.5069313049316406, 0.5220489501953125, 0.5371665954589844, 0.5522842407226562, 0.5674018859863281, 0.58251953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 11.0, 41.0, 197.0, 322.0, 301.0, 95.0, 31.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.273847579956055, -8.005331993103027, -7.736815929412842, -7.468299865722656, -7.199783802032471, -6.931267738342285, -6.662752151489258, -6.394236087799072, -6.125720024108887, -5.857203960418701, -5.588688373565674, -5.320172309875488, -5.051656246185303, -4.783140182495117, -4.51462459564209, -4.246108531951904, -3.977592945098877, -3.7090771198272705, -3.440561056137085, -3.1720452308654785, -2.903529167175293, -2.6350133419036865, -2.36649751663208, -2.0979814529418945, -1.829465627670288, -1.560949683189392, -1.292433738708496, -1.0239179134368896, -0.7554019689559937, -0.48688602447509766, -0.2183701992034912, 0.050145745277404785, 0.3186616897583008, 0.5871776342391968, 0.855693519115448, 1.1242094039916992, 1.3927253484725952, 1.6612412929534912, 1.9297571182250977, 2.198273181915283, 2.4667890071868896, 2.735304832458496, 3.0038208961486816, 3.272336721420288, 3.5408525466918945, 3.80936861038208, 4.077884674072266, 4.346400260925293, 4.6149163246154785, 4.883432388305664, 5.151947975158691, 5.420464038848877, 5.6889801025390625, 5.95749568939209, 6.226011753082275, 6.494527816772461, 6.763043403625488, 7.031559467315674, 7.300075054168701, 7.568591117858887, 7.837107181549072, 8.105623245239258, 8.374138832092285, 8.642654418945312, 8.911170959472656]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 14.0, 16.0, 17.0, 14.0, 31.0, 21.0, 33.0, 34.0, 36.0, 41.0, 42.0, 50.0, 37.0, 42.0, 37.0, 33.0, 52.0, 43.0, 30.0, 42.0, 41.0, 35.0, 38.0, 30.0, 31.0, 21.0, 24.0, 22.0, 10.0, 10.0, 8.0, 10.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5067453384399414, -1.4565467834472656, -1.4063481092453003, -1.3561495542526245, -1.3059508800506592, -1.2557523250579834, -1.2055537700653076, -1.1553552150726318, -1.1051565408706665, -1.0549579858779907, -1.0047593116760254, -0.9545607566833496, -0.904362142086029, -0.8541635274887085, -0.8039649724960327, -0.7537663578987122, -0.7035677433013916, -0.653369128704071, -0.6031705141067505, -0.5529719591140747, -0.5027733445167542, -0.4525747299194336, -0.4023761451244354, -0.35217756032943726, -0.3019789457321167, -0.25178033113479614, -0.20158174633979797, -0.1513831466436386, -0.10118454694747925, -0.05098593235015869, -0.0007873475551605225, 0.049411237239837646, 0.09960973262786865, 0.14980833232402802, 0.20000693202018738, 0.25020551681518555, 0.3004041314125061, 0.35060274600982666, 0.40080133080482483, 0.450999915599823, 0.5011985301971436, 0.5513971447944641, 0.6015957593917847, 0.6517943143844604, 0.701992928981781, 0.7521915435791016, 0.8023900985717773, 0.8525887131690979, 0.9027873277664185, 0.952985942363739, 1.0031845569610596, 1.0533831119537354, 1.1035816669464111, 1.1537803411483765, 1.2039788961410522, 1.2541775703430176, 1.3043761253356934, 1.3545746803283691, 1.4047733545303345, 1.4549719095230103, 1.5051705837249756, 1.5553691387176514, 1.6055676937103271, 1.655766248703003, 1.7059649229049683]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 6.0, 8.0, 9.0, 14.0, 11.0, 22.0, 26.0, 45.0, 53.0, 93.0, 113.0, 175.0, 337.0, 635.0, 1110.0, 2252.0, 4833.0, 11313.0, 27245.0, 68411.0, 166538.0, 305793.0, 256908.0, 119640.0, 47829.0, 19274.0, 8332.0, 3703.0, 1754.0, 843.0, 461.0, 262.0, 166.0, 91.0, 72.0, 46.0, 27.0, 32.0, 20.0, 14.0, 9.0, 12.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.85888671875, -0.8334808349609375, -0.808074951171875, -0.7826690673828125, -0.75726318359375, -0.7318572998046875, -0.706451416015625, -0.6810455322265625, -0.6556396484375, -0.6302337646484375, -0.604827880859375, -0.5794219970703125, -0.55401611328125, -0.5286102294921875, -0.503204345703125, -0.4777984619140625, -0.452392578125, -0.4269866943359375, -0.401580810546875, -0.3761749267578125, -0.35076904296875, -0.3253631591796875, -0.299957275390625, -0.2745513916015625, -0.2491455078125, -0.2237396240234375, -0.198333740234375, -0.1729278564453125, -0.14752197265625, -0.1221160888671875, -0.096710205078125, -0.0713043212890625, -0.0458984375, -0.0204925537109375, 0.004913330078125, 0.0303192138671875, 0.05572509765625, 0.0811309814453125, 0.106536865234375, 0.1319427490234375, 0.1573486328125, 0.1827545166015625, 0.208160400390625, 0.2335662841796875, 0.25897216796875, 0.2843780517578125, 0.309783935546875, 0.3351898193359375, 0.360595703125, 0.3860015869140625, 0.411407470703125, 0.4368133544921875, 0.46221923828125, 0.4876251220703125, 0.513031005859375, 0.5384368896484375, 0.5638427734375, 0.5892486572265625, 0.614654541015625, 0.6400604248046875, 0.66546630859375, 0.6908721923828125, 0.716278076171875, 0.7416839599609375, 0.76708984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 11.0, 7.0, 10.0, 22.0, 11.0, 19.0, 22.0, 26.0, 26.0, 37.0, 36.0, 44.0, 60.0, 47.0, 56.0, 59.0, 58.0, 51.0, 64.0, 43.0, 57.0, 33.0, 25.0, 29.0, 26.0, 21.0, 23.0, 12.0, 12.0, 10.0, 9.0, 10.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.492431640625, -0.4770164489746094, -0.46160125732421875, -0.4461860656738281, -0.4307708740234375, -0.4153556823730469, -0.39994049072265625, -0.3845252990722656, -0.369110107421875, -0.3536949157714844, -0.33827972412109375, -0.3228645324707031, -0.3074493408203125, -0.2920341491699219, -0.27661895751953125, -0.2612037658691406, -0.24578857421875, -0.23037338256835938, -0.21495819091796875, -0.19954299926757812, -0.1841278076171875, -0.16871261596679688, -0.15329742431640625, -0.13788223266601562, -0.122467041015625, -0.10705184936523438, -0.09163665771484375, -0.07622146606445312, -0.0608062744140625, -0.045391082763671875, -0.02997589111328125, -0.014560699462890625, 0.0008544921875, 0.016269683837890625, 0.03168487548828125, 0.047100067138671875, 0.0625152587890625, 0.07793045043945312, 0.09334564208984375, 0.10876083374023438, 0.124176025390625, 0.13959121704101562, 0.15500640869140625, 0.17042160034179688, 0.1858367919921875, 0.20125198364257812, 0.21666717529296875, 0.23208236694335938, 0.24749755859375, 0.2629127502441406, 0.27832794189453125, 0.2937431335449219, 0.3091583251953125, 0.3245735168457031, 0.33998870849609375, 0.3554039001464844, 0.370819091796875, 0.3862342834472656, 0.40164947509765625, 0.4170646667480469, 0.4324798583984375, 0.4478950500488281, 0.46331024169921875, 0.4787254333496094, 0.494140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 18.0, 15.0, 27.0, 17.0, 23.0, 25.0, 32.0, 36.0, 51.0, 74.0, 128.0, 429.0, 3754.0, 138332.0, 835864.0, 66792.0, 2111.0, 307.0, 109.0, 69.0, 54.0, 32.0, 30.0, 27.0, 34.0, 30.0, 17.0, 15.0, 9.0, 11.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.78515625, -2.687103271484375, -2.58905029296875, -2.490997314453125, -2.3929443359375, -2.294891357421875, -2.19683837890625, -2.098785400390625, -2.000732421875, -1.902679443359375, -1.80462646484375, -1.706573486328125, -1.6085205078125, -1.510467529296875, -1.41241455078125, -1.314361572265625, -1.21630859375, -1.118255615234375, -1.02020263671875, -0.922149658203125, -0.8240966796875, -0.726043701171875, -0.62799072265625, -0.529937744140625, -0.431884765625, -0.333831787109375, -0.23577880859375, -0.137725830078125, -0.0396728515625, 0.058380126953125, 0.15643310546875, 0.254486083984375, 0.3525390625, 0.450592041015625, 0.54864501953125, 0.646697998046875, 0.7447509765625, 0.842803955078125, 0.94085693359375, 1.038909912109375, 1.136962890625, 1.235015869140625, 1.33306884765625, 1.431121826171875, 1.5291748046875, 1.627227783203125, 1.72528076171875, 1.823333740234375, 1.92138671875, 2.019439697265625, 2.11749267578125, 2.215545654296875, 2.3135986328125, 2.411651611328125, 2.50970458984375, 2.607757568359375, 2.705810546875, 2.803863525390625, 2.90191650390625, 2.999969482421875, 3.0980224609375, 3.196075439453125, 3.29412841796875, 3.392181396484375, 3.490234375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 9.0, 4.0, 12.0, 13.0, 15.0, 16.0, 18.0, 24.0, 21.0, 15.0, 31.0, 23.0, 33.0, 35.0, 35.0, 32.0, 43.0, 30.0, 48.0, 27.0, 45.0, 31.0, 36.0, 35.0, 31.0, 52.0, 32.0, 41.0, 27.0, 21.0, 28.0, 28.0, 12.0, 15.0, 13.0, 6.0, 8.0, 13.0, 10.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.759765625, -0.7356643676757812, -0.7115631103515625, -0.6874618530273438, -0.663360595703125, -0.6392593383789062, -0.6151580810546875, -0.5910568237304688, -0.56695556640625, -0.5428543090820312, -0.5187530517578125, -0.49465179443359375, -0.470550537109375, -0.44644927978515625, -0.4223480224609375, -0.39824676513671875, -0.3741455078125, -0.35004425048828125, -0.3259429931640625, -0.30184173583984375, -0.277740478515625, -0.25363922119140625, -0.2295379638671875, -0.20543670654296875, -0.18133544921875, -0.15723419189453125, -0.1331329345703125, -0.10903167724609375, -0.084930419921875, -0.06082916259765625, -0.0367279052734375, -0.01262664794921875, 0.011474609375, 0.03557586669921875, 0.0596771240234375, 0.08377838134765625, 0.107879638671875, 0.13198089599609375, 0.1560821533203125, 0.18018341064453125, 0.20428466796875, 0.22838592529296875, 0.2524871826171875, 0.27658843994140625, 0.300689697265625, 0.32479095458984375, 0.3488922119140625, 0.37299346923828125, 0.3970947265625, 0.42119598388671875, 0.4452972412109375, 0.46939849853515625, 0.493499755859375, 0.5176010131835938, 0.5417022705078125, 0.5658035278320312, 0.58990478515625, 0.6140060424804688, 0.6381072998046875, 0.6622085571289062, 0.686309814453125, 0.7104110717773438, 0.7345123291015625, 0.7586135864257812, 0.78271484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 8.0, 11.0, 11.0, 24.0, 18.0, 48.0, 75.0, 134.0, 244.0, 415.0, 917.0, 1928.0, 4230.0, 10799.0, 30880.0, 109807.0, 363967.0, 365521.0, 109711.0, 30839.0, 10724.0, 4322.0, 1908.0, 921.0, 472.0, 243.0, 134.0, 73.0, 37.0, 41.0, 25.0, 18.0, 12.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.53955078125, -0.5232009887695312, -0.5068511962890625, -0.49050140380859375, -0.474151611328125, -0.45780181884765625, -0.4414520263671875, -0.42510223388671875, -0.40875244140625, -0.39240264892578125, -0.3760528564453125, -0.35970306396484375, -0.343353271484375, -0.32700347900390625, -0.3106536865234375, -0.29430389404296875, -0.2779541015625, -0.26160430908203125, -0.2452545166015625, -0.22890472412109375, -0.212554931640625, -0.19620513916015625, -0.1798553466796875, -0.16350555419921875, -0.14715576171875, -0.13080596923828125, -0.1144561767578125, -0.09810638427734375, -0.081756591796875, -0.06540679931640625, -0.0490570068359375, -0.03270721435546875, -0.016357421875, -7.62939453125e-06, 0.0163421630859375, 0.03269195556640625, 0.049041748046875, 0.06539154052734375, 0.0817413330078125, 0.09809112548828125, 0.11444091796875, 0.13079071044921875, 0.1471405029296875, 0.16349029541015625, 0.179840087890625, 0.19618988037109375, 0.2125396728515625, 0.22888946533203125, 0.2452392578125, 0.26158905029296875, 0.2779388427734375, 0.29428863525390625, 0.310638427734375, 0.32698822021484375, 0.3433380126953125, 0.35968780517578125, 0.37603759765625, 0.39238739013671875, 0.4087371826171875, 0.42508697509765625, 0.441436767578125, 0.45778656005859375, 0.4741363525390625, 0.49048614501953125, 0.5068359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 14.0, 8.0, 16.0, 17.0, 24.0, 29.0, 56.0, 74.0, 94.0, 119.0, 127.0, 139.0, 72.0, 58.0, 48.0, 43.0, 16.0, 8.0, 8.0, 11.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.647275924682617e-05, -7.418449968099594e-05, -7.189624011516571e-05, -6.960798054933548e-05, -6.731972098350525e-05, -6.503146141767502e-05, -6.274320185184479e-05, -6.045494228601456e-05, -5.8166682720184326e-05, -5.5878423154354095e-05, -5.3590163588523865e-05, -5.1301904022693634e-05, -4.90136444568634e-05, -4.672538489103317e-05, -4.443712532520294e-05, -4.214886575937271e-05, -3.986060619354248e-05, -3.757234662771225e-05, -3.528408706188202e-05, -3.299582749605179e-05, -3.070756793022156e-05, -2.8419308364391327e-05, -2.6131048798561096e-05, -2.3842789232730865e-05, -2.1554529666900635e-05, -1.9266270101070404e-05, -1.6978010535240173e-05, -1.4689750969409943e-05, -1.2401491403579712e-05, -1.0113231837749481e-05, -7.82497227191925e-06, -5.53671270608902e-06, -3.248453140258789e-06, -9.601935744285583e-07, 1.3280659914016724e-06, 3.616325557231903e-06, 5.904585123062134e-06, 8.192844688892365e-06, 1.0481104254722595e-05, 1.2769363820552826e-05, 1.5057623386383057e-05, 1.7345882952213287e-05, 1.9634142518043518e-05, 2.192240208387375e-05, 2.421066164970398e-05, 2.649892121553421e-05, 2.878718078136444e-05, 3.107544034719467e-05, 3.33636999130249e-05, 3.565195947885513e-05, 3.7940219044685364e-05, 4.0228478610515594e-05, 4.2516738176345825e-05, 4.4804997742176056e-05, 4.709325730800629e-05, 4.938151687383652e-05, 5.166977643966675e-05, 5.395803600549698e-05, 5.624629557132721e-05, 5.853455513715744e-05, 6.082281470298767e-05, 6.31110742688179e-05, 6.539933383464813e-05, 6.768759340047836e-05, 6.99758529663086e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 2.0, 7.0, 10.0, 15.0, 15.0, 16.0, 12.0, 16.0, 29.0, 30.0, 45.0, 75.0, 153.0, 463.0, 2400.0, 21764.0, 322943.0, 638040.0, 56431.0, 4733.0, 771.0, 233.0, 102.0, 40.0, 25.0, 27.0, 23.0, 21.0, 19.0, 12.0, 13.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 8.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97119140625, -0.941009521484375, -0.91082763671875, -0.880645751953125, -0.8504638671875, -0.820281982421875, -0.79010009765625, -0.759918212890625, -0.729736328125, -0.699554443359375, -0.66937255859375, -0.639190673828125, -0.6090087890625, -0.578826904296875, -0.54864501953125, -0.518463134765625, -0.48828125, -0.458099365234375, -0.42791748046875, -0.397735595703125, -0.3675537109375, -0.337371826171875, -0.30718994140625, -0.277008056640625, -0.246826171875, -0.216644287109375, -0.18646240234375, -0.156280517578125, -0.1260986328125, -0.095916748046875, -0.06573486328125, -0.035552978515625, -0.00537109375, 0.024810791015625, 0.05499267578125, 0.085174560546875, 0.1153564453125, 0.145538330078125, 0.17572021484375, 0.205902099609375, 0.236083984375, 0.266265869140625, 0.29644775390625, 0.326629638671875, 0.3568115234375, 0.386993408203125, 0.41717529296875, 0.447357177734375, 0.4775390625, 0.507720947265625, 0.53790283203125, 0.568084716796875, 0.5982666015625, 0.628448486328125, 0.65863037109375, 0.688812255859375, 0.718994140625, 0.749176025390625, 0.77935791015625, 0.809539794921875, 0.8397216796875, 0.869903564453125, 0.90008544921875, 0.930267333984375, 0.96044921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 3.0, 6.0, 8.0, 15.0, 13.0, 16.0, 20.0, 18.0, 26.0, 31.0, 37.0, 32.0, 42.0, 38.0, 45.0, 68.0, 64.0, 59.0, 61.0, 54.0, 56.0, 34.0, 39.0, 31.0, 19.0, 22.0, 18.0, 26.0, 12.0, 17.0, 8.0, 4.0, 11.0, 5.0, 7.0, 3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2449951171875, -0.23816299438476562, -0.23133087158203125, -0.22449874877929688, -0.2176666259765625, -0.21083450317382812, -0.20400238037109375, -0.19717025756835938, -0.190338134765625, -0.18350601196289062, -0.17667388916015625, -0.16984176635742188, -0.1630096435546875, -0.15617752075195312, -0.14934539794921875, -0.14251327514648438, -0.13568115234375, -0.12884902954101562, -0.12201690673828125, -0.11518478393554688, -0.1083526611328125, -0.10152053833007812, -0.09468841552734375, -0.08785629272460938, -0.081024169921875, -0.07419204711914062, -0.06735992431640625, -0.060527801513671875, -0.0536956787109375, -0.046863555908203125, -0.04003143310546875, -0.033199310302734375, -0.0263671875, -0.019535064697265625, -0.01270294189453125, -0.005870819091796875, 0.0009613037109375, 0.007793426513671875, 0.01462554931640625, 0.021457672119140625, 0.028289794921875, 0.035121917724609375, 0.04195404052734375, 0.048786163330078125, 0.0556182861328125, 0.062450408935546875, 0.06928253173828125, 0.07611465454101562, 0.08294677734375, 0.08977890014648438, 0.09661102294921875, 0.10344314575195312, 0.1102752685546875, 0.11710739135742188, 0.12393951416015625, 0.13077163696289062, 0.137603759765625, 0.14443588256835938, 0.15126800537109375, 0.15810012817382812, 0.1649322509765625, 0.17176437377929688, 0.17859649658203125, 0.18542861938476562, 0.1922607421875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 71.0, 536.0, 370.0, 27.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.06617546081543, -24.51956558227539, -23.97295570373535, -23.426345825195312, -22.879737854003906, -22.333127975463867, -21.786518096923828, -21.23990821838379, -20.69329833984375, -20.14668846130371, -19.600078582763672, -19.053470611572266, -18.506860733032227, -17.960250854492188, -17.41364097595215, -16.86703109741211, -16.320423126220703, -15.773813247680664, -15.227204322814941, -14.680594444274902, -14.133984565734863, -13.58737564086914, -13.040765762329102, -12.494155883789062, -11.947546005249023, -11.400936126708984, -10.854327201843262, -10.307717323303223, -9.761107444763184, -9.214498519897461, -8.667888641357422, -8.121278762817383, -7.57466983795166, -7.028060436248779, -6.48145055770874, -5.934841156005859, -5.38823127746582, -4.8416218757629395, -4.295012474060059, -3.7484028339385986, -3.2017931938171387, -2.6551835536956787, -2.1085739135742188, -1.561964511871338, -1.015354871749878, -0.46874523162841797, 0.07786417007446289, 0.6244738101959229, 1.1710834503173828, 1.7176930904388428, 2.2643027305603027, 2.8109121322631836, 3.3575217723846436, 3.9041314125061035, 4.450740814208984, 4.997350692749023, 5.543960094451904, 6.090569496154785, 6.637179374694824, 7.183788776397705, 7.730398178100586, 8.277008056640625, 8.823617935180664, 9.370226860046387, 9.916836738586426]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 5.0, 2.0, 8.0, 6.0, 4.0, 12.0, 11.0, 10.0, 17.0, 15.0, 31.0, 28.0, 24.0, 18.0, 31.0, 31.0, 33.0, 40.0, 40.0, 39.0, 48.0, 43.0, 43.0, 40.0, 45.0, 29.0, 48.0, 38.0, 33.0, 37.0, 30.0, 23.0, 23.0, 20.0, 14.0, 11.0, 8.0, 7.0, 10.0, 14.0, 5.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.0680222511291504, -2.9741525650024414, -2.8802831172943115, -2.7864134311676025, -2.6925439834594727, -2.5986742973327637, -2.5048046112060547, -2.410935163497925, -2.317065715789795, -2.223196029663086, -2.129326581954956, -2.035456895828247, -1.9415874481201172, -1.8477177619934082, -1.7538481950759888, -1.6599786281585693, -1.5661089420318604, -1.472239375114441, -1.3783698081970215, -1.2845001220703125, -1.1906306743621826, -1.0967609882354736, -1.0028914213180542, -0.9090218544006348, -0.8151522874832153, -0.7212827205657959, -0.6274131536483765, -0.5335435271263123, -0.4396739602088928, -0.3458043932914734, -0.2519347667694092, -0.15806519985198975, -0.06419539451599121, 0.029674187302589417, 0.12354376912117004, 0.21741336584091187, 0.3112829327583313, 0.40515249967575073, 0.49902212619781494, 0.5928916931152344, 0.6867612600326538, 0.7806308269500732, 0.8745003938674927, 0.9683700203895569, 1.062239646911621, 1.156109094619751, 1.24997878074646, 1.3438483476638794, 1.4377179145812988, 1.5315874814987183, 1.6254570484161377, 1.7193267345428467, 1.8131961822509766, 1.9070658683776855, 2.0009355545043945, 2.0948050022125244, 2.1886744499206543, 2.2825441360473633, 2.376413583755493, 2.470283269882202, 2.564152717590332, 2.658022403717041, 2.75189208984375, 2.84576153755188, 2.939631223678589]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 10.0, 8.0, 15.0, 27.0, 22.0, 48.0, 47.0, 89.0, 111.0, 158.0, 271.0, 409.0, 862.0, 1744.0, 4696.0, 15691.0, 73557.0, 604879.0, 2928641.0, 479315.0, 62428.0, 13599.0, 4208.0, 1602.0, 719.0, 381.0, 233.0, 152.0, 102.0, 65.0, 53.0, 33.0, 28.0, 14.0, 14.0, 14.0, 8.0, 6.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1627197265625, -1.120361328125, -1.0780029296875, -1.03564453125, -0.9932861328125, -0.950927734375, -0.9085693359375, -0.8662109375, -0.8238525390625, -0.781494140625, -0.7391357421875, -0.69677734375, -0.6544189453125, -0.612060546875, -0.5697021484375, -0.52734375, -0.4849853515625, -0.442626953125, -0.4002685546875, -0.35791015625, -0.3155517578125, -0.273193359375, -0.2308349609375, -0.1884765625, -0.1461181640625, -0.103759765625, -0.0614013671875, -0.01904296875, 0.0233154296875, 0.065673828125, 0.1080322265625, 0.150390625, 0.1927490234375, 0.235107421875, 0.2774658203125, 0.31982421875, 0.3621826171875, 0.404541015625, 0.4468994140625, 0.4892578125, 0.5316162109375, 0.573974609375, 0.6163330078125, 0.65869140625, 0.7010498046875, 0.743408203125, 0.7857666015625, 0.828125, 0.8704833984375, 0.912841796875, 0.9552001953125, 0.99755859375, 1.0399169921875, 1.082275390625, 1.1246337890625, 1.1669921875, 1.2093505859375, 1.251708984375, 1.2940673828125, 1.33642578125, 1.3787841796875, 1.421142578125, 1.4635009765625, 1.505859375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 8.0, 11.0, 16.0, 8.0, 15.0, 19.0, 26.0, 29.0, 29.0, 40.0, 49.0, 51.0, 71.0, 55.0, 48.0, 53.0, 56.0, 61.0, 60.0, 51.0, 51.0, 35.0, 33.0, 25.0, 20.0, 18.0, 12.0, 13.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5147781372070312, -0.4983062744140625, -0.48183441162109375, -0.465362548828125, -0.44889068603515625, -0.4324188232421875, -0.41594696044921875, -0.39947509765625, -0.38300323486328125, -0.3665313720703125, -0.35005950927734375, -0.333587646484375, -0.31711578369140625, -0.3006439208984375, -0.28417205810546875, -0.2677001953125, -0.25122833251953125, -0.2347564697265625, -0.21828460693359375, -0.201812744140625, -0.18534088134765625, -0.1688690185546875, -0.15239715576171875, -0.13592529296875, -0.11945343017578125, -0.1029815673828125, -0.08650970458984375, -0.070037841796875, -0.05356597900390625, -0.0370941162109375, -0.02062225341796875, -0.004150390625, 0.01232147216796875, 0.0287933349609375, 0.04526519775390625, 0.061737060546875, 0.07820892333984375, 0.0946807861328125, 0.11115264892578125, 0.12762451171875, 0.14409637451171875, 0.1605682373046875, 0.17704010009765625, 0.193511962890625, 0.20998382568359375, 0.2264556884765625, 0.24292755126953125, 0.2593994140625, 0.27587127685546875, 0.2923431396484375, 0.30881500244140625, 0.325286865234375, 0.34175872802734375, 0.3582305908203125, 0.37470245361328125, 0.39117431640625, 0.40764617919921875, 0.4241180419921875, 0.44058990478515625, 0.457061767578125, 0.47353363037109375, 0.4900054931640625, 0.5064773559570312, 0.52294921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 21.0, 17.0, 33.0, 56.0, 103.0, 208.0, 367.0, 813.0, 1931.0, 5711.0, 19805.0, 79772.0, 381731.0, 1721793.0, 1546447.0, 337316.0, 71942.0, 17724.0, 5129.0, 1792.0, 778.0, 336.0, 180.0, 102.0, 66.0, 36.0, 24.0, 14.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.32977294921875, -1.2894287109375, -1.24908447265625, -1.208740234375, -1.16839599609375, -1.1280517578125, -1.08770751953125, -1.04736328125, -1.00701904296875, -0.9666748046875, -0.92633056640625, -0.885986328125, -0.84564208984375, -0.8052978515625, -0.76495361328125, -0.724609375, -0.68426513671875, -0.6439208984375, -0.60357666015625, -0.563232421875, -0.52288818359375, -0.4825439453125, -0.44219970703125, -0.40185546875, -0.36151123046875, -0.3211669921875, -0.28082275390625, -0.240478515625, -0.20013427734375, -0.1597900390625, -0.11944580078125, -0.0791015625, -0.03875732421875, 0.0015869140625, 0.04193115234375, 0.082275390625, 0.12261962890625, 0.1629638671875, 0.20330810546875, 0.24365234375, 0.28399658203125, 0.3243408203125, 0.36468505859375, 0.405029296875, 0.44537353515625, 0.4857177734375, 0.52606201171875, 0.56640625, 0.60675048828125, 0.6470947265625, 0.68743896484375, 0.727783203125, 0.76812744140625, 0.8084716796875, 0.84881591796875, 0.88916015625, 0.92950439453125, 0.9698486328125, 1.01019287109375, 1.050537109375, 1.09088134765625, 1.1312255859375, 1.17156982421875, 1.2119140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 5.0, 13.0, 9.0, 22.0, 23.0, 30.0, 44.0, 69.0, 94.0, 105.0, 177.0, 228.0, 278.0, 359.0, 461.0, 465.0, 386.0, 275.0, 249.0, 180.0, 163.0, 92.0, 93.0, 70.0, 48.0, 37.0, 24.0, 18.0, 13.0, 12.0, 6.0, 6.0, 5.0, 2.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6384658813476562, -0.6172637939453125, -0.5960617065429688, -0.574859619140625, -0.5536575317382812, -0.5324554443359375, -0.5112533569335938, -0.49005126953125, -0.46884918212890625, -0.4476470947265625, -0.42644500732421875, -0.405242919921875, -0.38404083251953125, -0.3628387451171875, -0.34163665771484375, -0.3204345703125, -0.29923248291015625, -0.2780303955078125, -0.25682830810546875, -0.235626220703125, -0.21442413330078125, -0.1932220458984375, -0.17201995849609375, -0.15081787109375, -0.12961578369140625, -0.1084136962890625, -0.08721160888671875, -0.066009521484375, -0.04480743408203125, -0.0236053466796875, -0.00240325927734375, 0.018798828125, 0.04000091552734375, 0.0612030029296875, 0.08240509033203125, 0.103607177734375, 0.12480926513671875, 0.1460113525390625, 0.16721343994140625, 0.18841552734375, 0.20961761474609375, 0.2308197021484375, 0.25202178955078125, 0.273223876953125, 0.29442596435546875, 0.3156280517578125, 0.33683013916015625, 0.3580322265625, 0.37923431396484375, 0.4004364013671875, 0.42163848876953125, 0.442840576171875, 0.46404266357421875, 0.4852447509765625, 0.5064468383789062, 0.52764892578125, 0.5488510131835938, 0.5700531005859375, 0.5912551879882812, 0.612457275390625, 0.6336593627929688, 0.6548614501953125, 0.6760635375976562, 0.697265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 12.0, 103.0, 414.0, 370.0, 94.0, 16.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.4108829498291, -17.938404083251953, -17.465925216674805, -16.993446350097656, -16.520967483520508, -16.04848861694336, -15.576010704040527, -15.103531837463379, -14.63105297088623, -14.158574104309082, -13.686095237731934, -13.213617324829102, -12.741138458251953, -12.268659591674805, -11.796180725097656, -11.323701858520508, -10.85122299194336, -10.378744125366211, -9.906265258789062, -9.433786392211914, -8.961308479309082, -8.488829612731934, -8.016350746154785, -7.543871879577637, -7.071393966674805, -6.598915100097656, -6.126436710357666, -5.653957843780518, -5.181478977203369, -4.709000587463379, -4.2365217208862305, -3.764042854309082, -3.2915639877319336, -2.8190853595733643, -2.346606492996216, -1.8741278648376465, -1.4016491174697876, -0.9291703701019287, -0.4566917419433594, 0.015787124633789062, 0.4882657527923584, 0.9607445001602173, 1.4332232475280762, 1.9057018756866455, 2.378180503845215, 2.8506593704223633, 3.3231379985809326, 3.795616865158081, 4.26809549331665, 4.740574359893799, 5.213052749633789, 5.6855316162109375, 6.158010482788086, 6.630489349365234, 7.102967739105225, 7.575446605682373, 8.047924995422363, 8.520403861999512, 8.99288272857666, 9.465360641479492, 9.93783950805664, 10.410318374633789, 10.882797241210938, 11.355276107788086, 11.827754974365234]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 9.0, 8.0, 12.0, 20.0, 10.0, 22.0, 23.0, 20.0, 23.0, 32.0, 31.0, 38.0, 41.0, 34.0, 48.0, 48.0, 53.0, 40.0, 42.0, 52.0, 37.0, 52.0, 37.0, 30.0, 38.0, 23.0, 27.0, 19.0, 20.0, 15.0, 11.0, 14.0, 13.0, 8.0, 17.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.070319414138794, -2.000481128692627, -1.930643081665039, -1.8608049154281616, -1.7909667491912842, -1.7211284637451172, -1.6512902975082397, -1.5814521312713623, -1.5116139650344849, -1.4417757987976074, -1.37193763256073, -1.3020994663238525, -1.2322611808776855, -1.1624231338500977, -1.0925848484039307, -1.0227466821670532, -0.9529085159301758, -0.8830703496932983, -0.8132321834564209, -0.7433939576148987, -0.6735557913780212, -0.6037176251411438, -0.5338793992996216, -0.46404123306274414, -0.3942030668258667, -0.32436490058898926, -0.25452670454978943, -0.1846885234117508, -0.11485034227371216, -0.04501217603683472, 0.024826020002365112, 0.09466421604156494, 0.16450214385986328, 0.23434032499790192, 0.30417850613594055, 0.3740167021751404, 0.4438548684120178, 0.5136930346488953, 0.5835312604904175, 0.6533694267272949, 0.7232075929641724, 0.7930457592010498, 0.8628839254379272, 0.9327221512794495, 1.0025603771209717, 1.0723984241485596, 1.1422367095947266, 1.212074875831604, 1.2819130420684814, 1.3517512083053589, 1.4215893745422363, 1.4914275407791138, 1.5612657070159912, 1.6311039924621582, 1.7009421586990356, 1.770780324935913, 1.8406184911727905, 1.910456657409668, 1.9802948236465454, 2.050132989883423, 2.11997127532959, 2.1898093223571777, 2.2596476078033447, 2.3294858932495117, 2.3993239402770996]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 7.0, 14.0, 26.0, 41.0, 79.0, 147.0, 382.0, 866.0, 2185.0, 5658.0, 16915.0, 85325.0, 482121.0, 375312.0, 58284.0, 13298.0, 4717.0, 1797.0, 752.0, 302.0, 139.0, 69.0, 29.0, 21.0, 16.0, 10.0, 8.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.466796875, -2.38946533203125, -2.3121337890625, -2.23480224609375, -2.157470703125, -2.08013916015625, -2.0028076171875, -1.92547607421875, -1.84814453125, -1.77081298828125, -1.6934814453125, -1.61614990234375, -1.538818359375, -1.46148681640625, -1.3841552734375, -1.30682373046875, -1.2294921875, -1.15216064453125, -1.0748291015625, -0.99749755859375, -0.920166015625, -0.84283447265625, -0.7655029296875, -0.68817138671875, -0.61083984375, -0.53350830078125, -0.4561767578125, -0.37884521484375, -0.301513671875, -0.22418212890625, -0.1468505859375, -0.06951904296875, 0.0078125, 0.08514404296875, 0.1624755859375, 0.23980712890625, 0.317138671875, 0.39447021484375, 0.4718017578125, 0.54913330078125, 0.62646484375, 0.70379638671875, 0.7811279296875, 0.85845947265625, 0.935791015625, 1.01312255859375, 1.0904541015625, 1.16778564453125, 1.2451171875, 1.32244873046875, 1.3997802734375, 1.47711181640625, 1.554443359375, 1.63177490234375, 1.7091064453125, 1.78643798828125, 1.86376953125, 1.94110107421875, 2.0184326171875, 2.09576416015625, 2.173095703125, 2.25042724609375, 2.3277587890625, 2.40509033203125, 2.482421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 15.0, 14.0, 22.0, 27.0, 29.0, 30.0, 43.0, 54.0, 67.0, 59.0, 68.0, 56.0, 81.0, 62.0, 70.0, 68.0, 44.0, 33.0, 37.0, 26.0, 20.0, 14.0, 15.0, 10.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.642578125, -0.6239776611328125, -0.605377197265625, -0.5867767333984375, -0.56817626953125, -0.5495758056640625, -0.530975341796875, -0.5123748779296875, -0.4937744140625, -0.4751739501953125, -0.456573486328125, -0.4379730224609375, -0.41937255859375, -0.4007720947265625, -0.382171630859375, -0.3635711669921875, -0.344970703125, -0.3263702392578125, -0.307769775390625, -0.2891693115234375, -0.27056884765625, -0.2519683837890625, -0.233367919921875, -0.2147674560546875, -0.1961669921875, -0.1775665283203125, -0.158966064453125, -0.1403656005859375, -0.12176513671875, -0.1031646728515625, -0.084564208984375, -0.0659637451171875, -0.04736328125, -0.0287628173828125, -0.010162353515625, 0.0084381103515625, 0.02703857421875, 0.0456390380859375, 0.064239501953125, 0.0828399658203125, 0.1014404296875, 0.1200408935546875, 0.138641357421875, 0.1572418212890625, 0.17584228515625, 0.1944427490234375, 0.213043212890625, 0.2316436767578125, 0.250244140625, 0.2688446044921875, 0.287445068359375, 0.3060455322265625, 0.32464599609375, 0.3432464599609375, 0.361846923828125, 0.3804473876953125, 0.3990478515625, 0.4176483154296875, 0.436248779296875, 0.4548492431640625, 0.47344970703125, 0.4920501708984375, 0.510650634765625, 0.5292510986328125, 0.5478515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 6.0, 6.0, 8.0, 5.0, 14.0, 10.0, 18.0, 21.0, 33.0, 53.0, 80.0, 126.0, 188.0, 374.0, 712.0, 1451.0, 3008.0, 6141.0, 13874.0, 37405.0, 128467.0, 355691.0, 332053.0, 111543.0, 33000.0, 12789.0, 5713.0, 2813.0, 1400.0, 668.0, 347.0, 169.0, 134.0, 62.0, 48.0, 42.0, 18.0, 17.0, 12.0, 11.0, 5.0, 6.0, 6.0, 4.0, 0.0, 7.0, 0.0, 1.0, 2.0], "bins": [-1.677734375, -1.63232421875, -1.5869140625, -1.54150390625, -1.49609375, -1.45068359375, -1.4052734375, -1.35986328125, -1.314453125, -1.26904296875, -1.2236328125, -1.17822265625, -1.1328125, -1.08740234375, -1.0419921875, -0.99658203125, -0.951171875, -0.90576171875, -0.8603515625, -0.81494140625, -0.76953125, -0.72412109375, -0.6787109375, -0.63330078125, -0.587890625, -0.54248046875, -0.4970703125, -0.45166015625, -0.40625, -0.36083984375, -0.3154296875, -0.27001953125, -0.224609375, -0.17919921875, -0.1337890625, -0.08837890625, -0.04296875, 0.00244140625, 0.0478515625, 0.09326171875, 0.138671875, 0.18408203125, 0.2294921875, 0.27490234375, 0.3203125, 0.36572265625, 0.4111328125, 0.45654296875, 0.501953125, 0.54736328125, 0.5927734375, 0.63818359375, 0.68359375, 0.72900390625, 0.7744140625, 0.81982421875, 0.865234375, 0.91064453125, 0.9560546875, 1.00146484375, 1.046875, 1.09228515625, 1.1376953125, 1.18310546875, 1.228515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 17.0, 10.0, 19.0, 22.0, 19.0, 32.0, 29.0, 41.0, 42.0, 31.0, 46.0, 59.0, 55.0, 64.0, 50.0, 56.0, 55.0, 42.0, 43.0, 41.0, 28.0, 36.0, 20.0, 20.0, 19.0, 18.0, 18.0, 10.0, 10.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.943359375, -0.9108123779296875, -0.878265380859375, -0.8457183837890625, -0.81317138671875, -0.7806243896484375, -0.748077392578125, -0.7155303955078125, -0.6829833984375, -0.6504364013671875, -0.617889404296875, -0.5853424072265625, -0.55279541015625, -0.5202484130859375, -0.487701416015625, -0.4551544189453125, -0.422607421875, -0.3900604248046875, -0.357513427734375, -0.3249664306640625, -0.29241943359375, -0.2598724365234375, -0.227325439453125, -0.1947784423828125, -0.1622314453125, -0.1296844482421875, -0.097137451171875, -0.0645904541015625, -0.03204345703125, 0.0005035400390625, 0.033050537109375, 0.0655975341796875, 0.09814453125, 0.1306915283203125, 0.163238525390625, 0.1957855224609375, 0.22833251953125, 0.2608795166015625, 0.293426513671875, 0.3259735107421875, 0.3585205078125, 0.3910675048828125, 0.423614501953125, 0.4561614990234375, 0.48870849609375, 0.5212554931640625, 0.553802490234375, 0.5863494873046875, 0.618896484375, 0.6514434814453125, 0.683990478515625, 0.7165374755859375, 0.74908447265625, 0.7816314697265625, 0.814178466796875, 0.8467254638671875, 0.8792724609375, 0.9118194580078125, 0.944366455078125, 0.9769134521484375, 1.00946044921875, 1.0420074462890625, 1.074554443359375, 1.1071014404296875, 1.1396484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 5.0, 26.0, 38.0, 50.0, 85.0, 154.0, 225.0, 429.0, 759.0, 1522.0, 4145.0, 17709.0, 238010.0, 719525.0, 53035.0, 7795.0, 2502.0, 1163.0, 586.0, 316.0, 186.0, 102.0, 66.0, 32.0, 25.0, 14.0, 14.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.10845947265625, -2.0430908203125, -1.97772216796875, -1.912353515625, -1.84698486328125, -1.7816162109375, -1.71624755859375, -1.65087890625, -1.58551025390625, -1.5201416015625, -1.45477294921875, -1.389404296875, -1.32403564453125, -1.2586669921875, -1.19329833984375, -1.1279296875, -1.06256103515625, -0.9971923828125, -0.93182373046875, -0.866455078125, -0.80108642578125, -0.7357177734375, -0.67034912109375, -0.60498046875, -0.53961181640625, -0.4742431640625, -0.40887451171875, -0.343505859375, -0.27813720703125, -0.2127685546875, -0.14739990234375, -0.08203125, -0.01666259765625, 0.0487060546875, 0.11407470703125, 0.179443359375, 0.24481201171875, 0.3101806640625, 0.37554931640625, 0.44091796875, 0.50628662109375, 0.5716552734375, 0.63702392578125, 0.702392578125, 0.76776123046875, 0.8331298828125, 0.89849853515625, 0.9638671875, 1.02923583984375, 1.0946044921875, 1.15997314453125, 1.225341796875, 1.29071044921875, 1.3560791015625, 1.42144775390625, 1.48681640625, 1.55218505859375, 1.6175537109375, 1.68292236328125, 1.748291015625, 1.81365966796875, 1.8790283203125, 1.94439697265625, 2.009765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 12.0, 12.0, 19.0, 62.0, 136.0, 269.0, 252.0, 116.0, 46.0, 18.0, 13.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00028252601623535156, -0.00027577951550483704, -0.0002690330147743225, -0.000262286514043808, -0.00025554001331329346, -0.00024879351258277893, -0.0002420470118522644, -0.00023530051112174988, -0.00022855401039123535, -0.00022180750966072083, -0.0002150610089302063, -0.00020831450819969177, -0.00020156800746917725, -0.00019482150673866272, -0.0001880750060081482, -0.00018132850527763367, -0.00017458200454711914, -0.00016783550381660461, -0.0001610890030860901, -0.00015434250235557556, -0.00014759600162506104, -0.0001408495008945465, -0.00013410300016403198, -0.00012735649943351746, -0.00012060999870300293, -0.0001138634979724884, -0.00010711699724197388, -0.00010037049651145935, -9.362399578094482e-05, -8.68774950504303e-05, -8.013099431991577e-05, -7.338449358940125e-05, -6.663799285888672e-05, -5.989149212837219e-05, -5.3144991397857666e-05, -4.639849066734314e-05, -3.965198993682861e-05, -3.290548920631409e-05, -2.615898847579956e-05, -1.9412487745285034e-05, -1.2665987014770508e-05, -5.9194862842559814e-06, 8.270144462585449e-07, 7.573515176773071e-06, 1.4320015907287598e-05, 2.1066516637802124e-05, 2.781301736831665e-05, 3.455951809883118e-05, 4.13060188293457e-05, 4.805251955986023e-05, 5.4799020290374756e-05, 6.154552102088928e-05, 6.829202175140381e-05, 7.503852248191833e-05, 8.178502321243286e-05, 8.853152394294739e-05, 9.527802467346191e-05, 0.00010202452540397644, 0.00010877102613449097, 0.00011551752686500549, 0.00012226402759552002, 0.00012901052832603455, 0.00013575702905654907, 0.0001425035297870636, 0.00014925003051757812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 9.0, 7.0, 8.0, 26.0, 29.0, 46.0, 87.0, 121.0, 200.0, 422.0, 804.0, 1603.0, 3424.0, 7790.0, 20097.0, 60116.0, 178145.0, 335669.0, 272430.0, 109858.0, 35272.0, 12404.0, 5168.0, 2305.0, 1158.0, 576.0, 317.0, 192.0, 98.0, 58.0, 29.0, 23.0, 13.0, 16.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5771484375, -0.5583877563476562, -0.5396270751953125, -0.5208663940429688, -0.502105712890625, -0.48334503173828125, -0.4645843505859375, -0.44582366943359375, -0.42706298828125, -0.40830230712890625, -0.3895416259765625, -0.37078094482421875, -0.352020263671875, -0.33325958251953125, -0.3144989013671875, -0.29573822021484375, -0.2769775390625, -0.25821685791015625, -0.2394561767578125, -0.22069549560546875, -0.201934814453125, -0.18317413330078125, -0.1644134521484375, -0.14565277099609375, -0.12689208984375, -0.10813140869140625, -0.0893707275390625, -0.07061004638671875, -0.051849365234375, -0.03308868408203125, -0.0143280029296875, 0.00443267822265625, 0.023193359375, 0.04195404052734375, 0.0607147216796875, 0.07947540283203125, 0.098236083984375, 0.11699676513671875, 0.1357574462890625, 0.15451812744140625, 0.17327880859375, 0.19203948974609375, 0.2108001708984375, 0.22956085205078125, 0.248321533203125, 0.26708221435546875, 0.2858428955078125, 0.30460357666015625, 0.3233642578125, 0.34212493896484375, 0.3608856201171875, 0.37964630126953125, 0.398406982421875, 0.41716766357421875, 0.4359283447265625, 0.45468902587890625, 0.47344970703125, 0.49221038818359375, 0.5109710693359375, 0.5297317504882812, 0.548492431640625, 0.5672531127929688, 0.5860137939453125, 0.6047744750976562, 0.62353515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 6.0, 14.0, 11.0, 20.0, 30.0, 25.0, 36.0, 37.0, 50.0, 66.0, 69.0, 59.0, 79.0, 71.0, 69.0, 51.0, 63.0, 50.0, 37.0, 40.0, 29.0, 22.0, 17.0, 13.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.3715782165527344, -0.35985565185546875, -0.3481330871582031, -0.3364105224609375, -0.3246879577636719, -0.31296539306640625, -0.3012428283691406, -0.289520263671875, -0.2777976989746094, -0.26607513427734375, -0.2543525695800781, -0.2426300048828125, -0.23090744018554688, -0.21918487548828125, -0.20746231079101562, -0.19573974609375, -0.18401718139648438, -0.17229461669921875, -0.16057205200195312, -0.1488494873046875, -0.13712692260742188, -0.12540435791015625, -0.11368179321289062, -0.101959228515625, -0.09023666381835938, -0.07851409912109375, -0.06679153442382812, -0.0550689697265625, -0.043346405029296875, -0.03162384033203125, -0.019901275634765625, -0.0081787109375, 0.003543853759765625, 0.01526641845703125, 0.026988983154296875, 0.0387115478515625, 0.050434112548828125, 0.06215667724609375, 0.07387924194335938, 0.085601806640625, 0.09732437133789062, 0.10904693603515625, 0.12076950073242188, 0.1324920654296875, 0.14421463012695312, 0.15593719482421875, 0.16765975952148438, 0.17938232421875, 0.19110488891601562, 0.20282745361328125, 0.21455001831054688, 0.2262725830078125, 0.23799514770507812, 0.24971771240234375, 0.2614402770996094, 0.273162841796875, 0.2848854064941406, 0.29660797119140625, 0.3083305358886719, 0.3200531005859375, 0.3317756652832031, 0.34349822998046875, 0.3552207946777344, 0.366943359375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 20.0, 112.0, 385.0, 371.0, 91.0, 22.0, 8.0, 0.0, 2.0, 2.0], "bins": [-26.549686431884766, -26.083263397216797, -25.616840362548828, -25.150415420532227, -24.683992385864258, -24.21756935119629, -23.75114631652832, -23.28472137451172, -22.81829833984375, -22.35187530517578, -21.885452270507812, -21.41902732849121, -20.952604293823242, -20.486181259155273, -20.019758224487305, -19.553333282470703, -19.086910247802734, -18.620487213134766, -18.154064178466797, -17.687639236450195, -17.221216201782227, -16.754793167114258, -16.28837013244629, -15.821946144104004, -15.355523109436035, -14.889100074768066, -14.422676086425781, -13.956253051757812, -13.489829063415527, -13.023406028747559, -12.556982040405273, -12.090559005737305, -11.624135971069336, -11.157712936401367, -10.691288948059082, -10.224865913391113, -9.758441925048828, -9.29201889038086, -8.825594902038574, -8.359171867370605, -7.89274787902832, -7.426324367523193, -6.959900856018066, -6.4934773445129395, -6.0270538330078125, -5.560630798339844, -5.094206809997559, -4.62778377532959, -4.161359786987305, -3.6949362754821777, -3.228512763977051, -2.762089252471924, -2.295665740966797, -1.829242467880249, -1.362818956375122, -0.8963954448699951, -0.42997217178344727, 0.0364513099193573, 0.5028747916221619, 0.969298243522644, 1.435721755027771, 1.9021451473236084, 2.3685686588287354, 2.8349921703338623, 3.3014156818389893]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 10.0, 11.0, 15.0, 9.0, 12.0, 25.0, 21.0, 21.0, 16.0, 15.0, 32.0, 47.0, 43.0, 45.0, 30.0, 51.0, 41.0, 46.0, 35.0, 42.0, 53.0, 35.0, 33.0, 36.0, 32.0, 33.0, 36.0, 27.0, 13.0, 22.0, 12.0, 13.0, 13.0, 11.0, 6.0, 12.0, 5.0, 2.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.858982563018799, -2.7792370319366455, -2.6994917392730713, -2.619746208190918, -2.5400009155273438, -2.4602553844451904, -2.380510091781616, -2.300764560699463, -2.2210192680358887, -2.1412737369537354, -2.061528444290161, -1.9817830324172974, -1.9020376205444336, -1.8222920894622803, -1.7425466775894165, -1.6628012657165527, -1.5830557346343994, -1.5033103227615356, -1.4235649108886719, -1.343819499015808, -1.2640740871429443, -1.184328556060791, -1.1045831441879272, -1.0248377323150635, -0.9450923204421997, -0.8653469085693359, -0.7856014966964722, -0.7058560252189636, -0.6261106133460999, -0.5463652014732361, -0.4666197597980499, -0.38687431812286377, -0.30712890625, -0.22738347947597504, -0.14763805270195007, -0.06789262592792511, 0.011852800846099854, 0.09159821271896362, 0.17134365439414978, 0.25108909606933594, 0.3308345079421997, 0.4105799198150635, 0.49032536149024963, 0.5700708031654358, 0.6498162150382996, 0.7295616269111633, 0.8093070983886719, 0.8890525102615356, 0.9687979221343994, 1.0485433340072632, 1.128288745880127, 1.2080341577529907, 1.2877795696258545, 1.3675251007080078, 1.4472705125808716, 1.5270159244537354, 1.6067613363265991, 1.686506748199463, 1.7662521600723267, 1.8459975719451904, 1.9257431030273438, 2.005488395690918, 2.0852339267730713, 2.1649794578552246, 2.244724750518799]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 12.0, 8.0, 10.0, 21.0, 28.0, 25.0, 54.0, 71.0, 122.0, 142.0, 227.0, 337.0, 716.0, 1276.0, 2590.0, 5699.0, 13735.0, 38591.0, 127730.0, 550357.0, 1825813.0, 1228133.0, 282822.0, 73650.0, 24299.0, 9500.0, 4056.0, 1883.0, 999.0, 516.0, 331.0, 167.0, 105.0, 72.0, 53.0, 30.0, 25.0, 22.0, 15.0, 3.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.79150390625, -0.7680740356445312, -0.7446441650390625, -0.7212142944335938, -0.697784423828125, -0.6743545532226562, -0.6509246826171875, -0.6274948120117188, -0.60406494140625, -0.5806350708007812, -0.5572052001953125, -0.5337753295898438, -0.510345458984375, -0.48691558837890625, -0.4634857177734375, -0.44005584716796875, -0.4166259765625, -0.39319610595703125, -0.3697662353515625, -0.34633636474609375, -0.322906494140625, -0.29947662353515625, -0.2760467529296875, -0.25261688232421875, -0.22918701171875, -0.20575714111328125, -0.1823272705078125, -0.15889739990234375, -0.135467529296875, -0.11203765869140625, -0.0886077880859375, -0.06517791748046875, -0.041748046875, -0.01831817626953125, 0.0051116943359375, 0.02854156494140625, 0.051971435546875, 0.07540130615234375, 0.0988311767578125, 0.12226104736328125, 0.14569091796875, 0.16912078857421875, 0.1925506591796875, 0.21598052978515625, 0.239410400390625, 0.26284027099609375, 0.2862701416015625, 0.30970001220703125, 0.3331298828125, 0.35655975341796875, 0.3799896240234375, 0.40341949462890625, 0.426849365234375, 0.45027923583984375, 0.4737091064453125, 0.49713897705078125, 0.52056884765625, 0.5439987182617188, 0.5674285888671875, 0.5908584594726562, 0.614288330078125, 0.6377182006835938, 0.6611480712890625, 0.6845779418945312, 0.7080078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 2.0, 12.0, 12.0, 14.0, 18.0, 29.0, 49.0, 43.0, 43.0, 59.0, 66.0, 49.0, 52.0, 71.0, 58.0, 60.0, 60.0, 54.0, 55.0, 37.0, 24.0, 26.0, 25.0, 21.0, 12.0, 9.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5242462158203125, -0.506988525390625, -0.4897308349609375, -0.47247314453125, -0.4552154541015625, -0.437957763671875, -0.4207000732421875, -0.4034423828125, -0.3861846923828125, -0.368927001953125, -0.3516693115234375, -0.33441162109375, -0.3171539306640625, -0.299896240234375, -0.2826385498046875, -0.265380859375, -0.2481231689453125, -0.230865478515625, -0.2136077880859375, -0.19635009765625, -0.1790924072265625, -0.161834716796875, -0.1445770263671875, -0.1273193359375, -0.1100616455078125, -0.092803955078125, -0.0755462646484375, -0.05828857421875, -0.0410308837890625, -0.023773193359375, -0.0065155029296875, 0.0107421875, 0.0279998779296875, 0.045257568359375, 0.0625152587890625, 0.07977294921875, 0.0970306396484375, 0.114288330078125, 0.1315460205078125, 0.1488037109375, 0.1660614013671875, 0.183319091796875, 0.2005767822265625, 0.21783447265625, 0.2350921630859375, 0.252349853515625, 0.2696075439453125, 0.286865234375, 0.3041229248046875, 0.321380615234375, 0.3386383056640625, 0.35589599609375, 0.3731536865234375, 0.390411376953125, 0.4076690673828125, 0.4249267578125, 0.4421844482421875, 0.459442138671875, 0.4766998291015625, 0.49395751953125, 0.5112152099609375, 0.528472900390625, 0.5457305908203125, 0.56298828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 9.0, 19.0, 35.0, 56.0, 107.0, 177.0, 383.0, 846.0, 2286.0, 8105.0, 37345.0, 212131.0, 1219162.0, 2085442.0, 519408.0, 85590.0, 16579.0, 4140.0, 1351.0, 529.0, 252.0, 139.0, 72.0, 46.0, 26.0, 16.0, 12.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.373046875, -1.3340911865234375, -1.295135498046875, -1.2561798095703125, -1.21722412109375, -1.1782684326171875, -1.139312744140625, -1.1003570556640625, -1.0614013671875, -1.0224456787109375, -0.983489990234375, -0.9445343017578125, -0.90557861328125, -0.8666229248046875, -0.827667236328125, -0.7887115478515625, -0.749755859375, -0.7108001708984375, -0.671844482421875, -0.6328887939453125, -0.59393310546875, -0.5549774169921875, -0.516021728515625, -0.4770660400390625, -0.4381103515625, -0.3991546630859375, -0.360198974609375, -0.3212432861328125, -0.28228759765625, -0.2433319091796875, -0.204376220703125, -0.1654205322265625, -0.12646484375, -0.0875091552734375, -0.048553466796875, -0.0095977783203125, 0.02935791015625, 0.0683135986328125, 0.107269287109375, 0.1462249755859375, 0.1851806640625, 0.2241363525390625, 0.263092041015625, 0.3020477294921875, 0.34100341796875, 0.3799591064453125, 0.418914794921875, 0.4578704833984375, 0.496826171875, 0.5357818603515625, 0.574737548828125, 0.6136932373046875, 0.65264892578125, 0.6916046142578125, 0.730560302734375, 0.7695159912109375, 0.8084716796875, 0.8474273681640625, 0.886383056640625, 0.9253387451171875, 0.96429443359375, 1.0032501220703125, 1.042205810546875, 1.0811614990234375, 1.1201171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 2.0, 5.0, 5.0, 11.0, 14.0, 19.0, 26.0, 46.0, 68.0, 93.0, 125.0, 171.0, 245.0, 291.0, 319.0, 391.0, 454.0, 373.0, 355.0, 262.0, 219.0, 160.0, 113.0, 88.0, 67.0, 46.0, 23.0, 29.0, 15.0, 14.0, 10.0, 12.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7744140625, -0.74810791015625, -0.7218017578125, -0.69549560546875, -0.669189453125, -0.64288330078125, -0.6165771484375, -0.59027099609375, -0.56396484375, -0.53765869140625, -0.5113525390625, -0.48504638671875, -0.458740234375, -0.43243408203125, -0.4061279296875, -0.37982177734375, -0.353515625, -0.32720947265625, -0.3009033203125, -0.27459716796875, -0.248291015625, -0.22198486328125, -0.1956787109375, -0.16937255859375, -0.14306640625, -0.11676025390625, -0.0904541015625, -0.06414794921875, -0.037841796875, -0.01153564453125, 0.0147705078125, 0.04107666015625, 0.0673828125, 0.09368896484375, 0.1199951171875, 0.14630126953125, 0.172607421875, 0.19891357421875, 0.2252197265625, 0.25152587890625, 0.27783203125, 0.30413818359375, 0.3304443359375, 0.35675048828125, 0.383056640625, 0.40936279296875, 0.4356689453125, 0.46197509765625, 0.48828125, 0.51458740234375, 0.5408935546875, 0.56719970703125, 0.593505859375, 0.61981201171875, 0.6461181640625, 0.67242431640625, 0.69873046875, 0.72503662109375, 0.7513427734375, 0.77764892578125, 0.803955078125, 0.83026123046875, 0.8565673828125, 0.88287353515625, 0.9091796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 18.0, 20.0, 44.0, 59.0, 83.0, 99.0, 110.0, 108.0, 113.0, 90.0, 86.0, 58.0, 43.0, 22.0, 17.0, 11.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.126149654388428, -5.982048988342285, -5.837948322296143, -5.693848133087158, -5.549747467041016, -5.405646800994873, -5.2615461349487305, -5.117445468902588, -4.973344802856445, -4.829244136810303, -4.68514347076416, -4.541043281555176, -4.396942615509033, -4.252841949462891, -4.108741283416748, -3.9646406173706055, -3.820540428161621, -3.6764397621154785, -3.532339334487915, -3.3882386684417725, -3.244138240814209, -3.1000375747680664, -2.955936908721924, -2.8118362426757812, -2.6677358150482178, -2.523635149002075, -2.3795347213745117, -2.235434055328369, -2.0913333892822266, -1.947232961654663, -1.8031322956085205, -1.6590317487716675, -1.5149307250976562, -1.3708301782608032, -1.2267296314239502, -1.0826289653778076, -0.9385284185409546, -0.7944278717041016, -0.6503272652626038, -0.506226658821106, -0.36212611198425293, -0.21802553534507751, -0.0739249587059021, 0.07017561793327332, 0.21427619457244873, 0.35837674140930176, 0.5024773478507996, 0.6465779542922974, 0.7906785011291504, 0.9347790479660034, 1.0788795948028564, 1.222980260848999, 1.367080807685852, 1.511181354522705, 1.6552820205688477, 1.7993825674057007, 1.9434831142425537, 2.0875837802886963, 2.2316842079162598, 2.3757848739624023, 2.519885540008545, 2.6639859676361084, 2.808086633682251, 2.9521870613098145, 3.096287727355957]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 2.0, 4.0, 6.0, 10.0, 13.0, 14.0, 16.0, 10.0, 14.0, 20.0, 29.0, 24.0, 26.0, 37.0, 29.0, 44.0, 37.0, 26.0, 40.0, 41.0, 31.0, 52.0, 29.0, 46.0, 44.0, 43.0, 43.0, 39.0, 29.0, 32.0, 24.0, 24.0, 26.0, 15.0, 19.0, 10.0, 13.0, 12.0, 12.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.309464454650879, -2.230226755142212, -2.150989294052124, -2.071751594543457, -1.9925140142440796, -1.9132764339447021, -1.8340388536453247, -1.7548012733459473, -1.6755635738372803, -1.5963259935379028, -1.5170884132385254, -1.4378507137298584, -1.358613133430481, -1.2793755531311035, -1.200137972831726, -1.1209003925323486, -1.0416628122329712, -0.9624252319335938, -0.8831875920295715, -0.8039500117301941, -0.7247123718261719, -0.6454747915267944, -0.566237211227417, -0.4869995713233948, -0.40776199102401733, -0.3285243809223175, -0.24928678572177887, -0.17004919052124023, -0.0908115804195404, -0.011573970317840576, 0.06766360998153687, 0.14690124988555908, 0.22613883018493652, 0.30537644028663635, 0.3846140503883362, 0.4638516306877136, 0.5430892705917358, 0.6223268508911133, 0.7015644311904907, 0.7808020710945129, 0.8600396513938904, 0.9392772316932678, 1.01851487159729, 1.0977524518966675, 1.176990032196045, 1.256227731704712, 1.3354651927947998, 1.4147028923034668, 1.4939404726028442, 1.5731780529022217, 1.6524156332015991, 1.7316532135009766, 1.8108909130096436, 1.890128493309021, 1.9693660736083984, 2.0486037731170654, 2.1278412342071533, 2.2070789337158203, 2.286316394805908, 2.365554094314575, 2.444791555404663, 2.52402925491333, 2.603266716003418, 2.682504415512085, 2.761742115020752]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 8.0, 5.0, 11.0, 12.0, 27.0, 34.0, 53.0, 77.0, 118.0, 254.0, 398.0, 768.0, 1654.0, 3742.0, 9136.0, 23144.0, 62629.0, 165004.0, 326173.0, 270233.0, 114590.0, 42603.0, 16100.0, 6426.0, 2656.0, 1248.0, 611.0, 318.0, 190.0, 116.0, 62.0, 41.0, 36.0, 21.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.6435546875, -1.594940185546875, -1.54632568359375, -1.497711181640625, -1.4490966796875, -1.400482177734375, -1.35186767578125, -1.303253173828125, -1.254638671875, -1.206024169921875, -1.15740966796875, -1.108795166015625, -1.0601806640625, -1.011566162109375, -0.96295166015625, -0.914337158203125, -0.86572265625, -0.817108154296875, -0.76849365234375, -0.719879150390625, -0.6712646484375, -0.622650146484375, -0.57403564453125, -0.525421142578125, -0.476806640625, -0.428192138671875, -0.37957763671875, -0.330963134765625, -0.2823486328125, -0.233734130859375, -0.18511962890625, -0.136505126953125, -0.087890625, -0.039276123046875, 0.00933837890625, 0.057952880859375, 0.1065673828125, 0.155181884765625, 0.20379638671875, 0.252410888671875, 0.301025390625, 0.349639892578125, 0.39825439453125, 0.446868896484375, 0.4954833984375, 0.544097900390625, 0.59271240234375, 0.641326904296875, 0.68994140625, 0.738555908203125, 0.78717041015625, 0.835784912109375, 0.8843994140625, 0.933013916015625, 0.98162841796875, 1.030242919921875, 1.078857421875, 1.127471923828125, 1.17608642578125, 1.224700927734375, 1.2733154296875, 1.321929931640625, 1.37054443359375, 1.419158935546875, 1.4677734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 3.0, 12.0, 20.0, 22.0, 20.0, 26.0, 32.0, 30.0, 33.0, 55.0, 54.0, 51.0, 59.0, 56.0, 53.0, 64.0, 63.0, 57.0, 45.0, 46.0, 39.0, 26.0, 23.0, 29.0, 12.0, 17.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.47115325927734375, -0.4554901123046875, -0.43982696533203125, -0.424163818359375, -0.40850067138671875, -0.3928375244140625, -0.37717437744140625, -0.36151123046875, -0.34584808349609375, -0.3301849365234375, -0.31452178955078125, -0.298858642578125, -0.28319549560546875, -0.2675323486328125, -0.25186920166015625, -0.2362060546875, -0.22054290771484375, -0.2048797607421875, -0.18921661376953125, -0.173553466796875, -0.15789031982421875, -0.1422271728515625, -0.12656402587890625, -0.11090087890625, -0.09523773193359375, -0.0795745849609375, -0.06391143798828125, -0.048248291015625, -0.03258514404296875, -0.0169219970703125, -0.00125885009765625, 0.014404296875, 0.03006744384765625, 0.0457305908203125, 0.06139373779296875, 0.077056884765625, 0.09272003173828125, 0.1083831787109375, 0.12404632568359375, 0.13970947265625, 0.15537261962890625, 0.1710357666015625, 0.18669891357421875, 0.202362060546875, 0.21802520751953125, 0.2336883544921875, 0.24935150146484375, 0.2650146484375, 0.28067779541015625, 0.2963409423828125, 0.31200408935546875, 0.327667236328125, 0.34333038330078125, 0.3589935302734375, 0.37465667724609375, 0.39031982421875, 0.40598297119140625, 0.4216461181640625, 0.43730926513671875, 0.452972412109375, 0.46863555908203125, 0.4842987060546875, 0.49996185302734375, 0.515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 10.0, 10.0, 17.0, 21.0, 17.0, 38.0, 60.0, 86.0, 164.0, 264.0, 516.0, 1015.0, 1903.0, 3713.0, 7316.0, 14493.0, 29491.0, 58592.0, 114167.0, 197285.0, 240098.0, 178022.0, 99873.0, 51100.0, 25092.0, 12424.0, 6178.0, 3036.0, 1603.0, 857.0, 447.0, 255.0, 135.0, 91.0, 53.0, 36.0, 20.0, 19.0, 13.0, 9.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.236328125, -1.20037841796875, -1.1644287109375, -1.12847900390625, -1.092529296875, -1.05657958984375, -1.0206298828125, -0.98468017578125, -0.94873046875, -0.91278076171875, -0.8768310546875, -0.84088134765625, -0.804931640625, -0.76898193359375, -0.7330322265625, -0.69708251953125, -0.6611328125, -0.62518310546875, -0.5892333984375, -0.55328369140625, -0.517333984375, -0.48138427734375, -0.4454345703125, -0.40948486328125, -0.37353515625, -0.33758544921875, -0.3016357421875, -0.26568603515625, -0.229736328125, -0.19378662109375, -0.1578369140625, -0.12188720703125, -0.0859375, -0.04998779296875, -0.0140380859375, 0.02191162109375, 0.057861328125, 0.09381103515625, 0.1297607421875, 0.16571044921875, 0.20166015625, 0.23760986328125, 0.2735595703125, 0.30950927734375, 0.345458984375, 0.38140869140625, 0.4173583984375, 0.45330810546875, 0.4892578125, 0.52520751953125, 0.5611572265625, 0.59710693359375, 0.633056640625, 0.66900634765625, 0.7049560546875, 0.74090576171875, 0.77685546875, 0.81280517578125, 0.8487548828125, 0.88470458984375, 0.920654296875, 0.95660400390625, 0.9925537109375, 1.02850341796875, 1.064453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 12.0, 10.0, 23.0, 19.0, 28.0, 22.0, 23.0, 38.0, 25.0, 35.0, 29.0, 37.0, 38.0, 39.0, 42.0, 39.0, 43.0, 41.0, 40.0, 48.0, 38.0, 35.0, 36.0, 29.0, 39.0, 23.0, 30.0, 25.0, 18.0, 11.0, 15.0, 8.0, 4.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.805908203125, -0.77490234375, -0.743896484375, -0.712890625, -0.681884765625, -0.65087890625, -0.619873046875, -0.5888671875, -0.557861328125, -0.52685546875, -0.495849609375, -0.46484375, -0.433837890625, -0.40283203125, -0.371826171875, -0.3408203125, -0.309814453125, -0.27880859375, -0.247802734375, -0.216796875, -0.185791015625, -0.15478515625, -0.123779296875, -0.0927734375, -0.061767578125, -0.03076171875, 0.000244140625, 0.03125, 0.062255859375, 0.09326171875, 0.124267578125, 0.1552734375, 0.186279296875, 0.21728515625, 0.248291015625, 0.279296875, 0.310302734375, 0.34130859375, 0.372314453125, 0.4033203125, 0.434326171875, 0.46533203125, 0.496337890625, 0.52734375, 0.558349609375, 0.58935546875, 0.620361328125, 0.6513671875, 0.682373046875, 0.71337890625, 0.744384765625, 0.775390625, 0.806396484375, 0.83740234375, 0.868408203125, 0.8994140625, 0.930419921875, 0.96142578125, 0.992431640625, 1.0234375, 1.054443359375, 1.08544921875, 1.116455078125, 1.1474609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 9.0, 13.0, 19.0, 20.0, 32.0, 62.0, 63.0, 108.0, 148.0, 210.0, 322.0, 615.0, 1099.0, 2492.0, 7153.0, 31724.0, 206720.0, 568766.0, 188792.0, 28442.0, 6769.0, 2304.0, 1056.0, 578.0, 390.0, 188.0, 132.0, 118.0, 45.0, 44.0, 41.0, 19.0, 20.0, 15.0, 11.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296875, -1.2513275146484375, -1.205780029296875, -1.1602325439453125, -1.11468505859375, -1.0691375732421875, -1.023590087890625, -0.9780426025390625, -0.9324951171875, -0.8869476318359375, -0.841400146484375, -0.7958526611328125, -0.75030517578125, -0.7047576904296875, -0.659210205078125, -0.6136627197265625, -0.568115234375, -0.5225677490234375, -0.477020263671875, -0.4314727783203125, -0.38592529296875, -0.3403778076171875, -0.294830322265625, -0.2492828369140625, -0.2037353515625, -0.1581878662109375, -0.112640380859375, -0.0670928955078125, -0.02154541015625, 0.0240020751953125, 0.069549560546875, 0.1150970458984375, 0.16064453125, 0.2061920166015625, 0.251739501953125, 0.2972869873046875, 0.34283447265625, 0.3883819580078125, 0.433929443359375, 0.4794769287109375, 0.5250244140625, 0.5705718994140625, 0.616119384765625, 0.6616668701171875, 0.70721435546875, 0.7527618408203125, 0.798309326171875, 0.8438568115234375, 0.889404296875, 0.9349517822265625, 0.980499267578125, 1.0260467529296875, 1.07159423828125, 1.1171417236328125, 1.162689208984375, 1.2082366943359375, 1.2537841796875, 1.2993316650390625, 1.344879150390625, 1.3904266357421875, 1.43597412109375, 1.4815216064453125, 1.527069091796875, 1.5726165771484375, 1.6181640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 11.0, 25.0, 36.0, 91.0, 176.0, 244.0, 206.0, 96.0, 50.0, 23.0, 17.0, 14.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00037384033203125, -0.0003646276891231537, -0.0003554150462150574, -0.00034620240330696106, -0.00033698976039886475, -0.00032777711749076843, -0.0003185644745826721, -0.0003093518316745758, -0.0003001391887664795, -0.0002909265458583832, -0.00028171390295028687, -0.00027250126004219055, -0.00026328861713409424, -0.0002540759742259979, -0.0002448633313179016, -0.0002356506884098053, -0.00022643804550170898, -0.00021722540259361267, -0.00020801275968551636, -0.00019880011677742004, -0.00018958747386932373, -0.00018037483096122742, -0.0001711621880531311, -0.0001619495451450348, -0.00015273690223693848, -0.00014352425932884216, -0.00013431161642074585, -0.00012509897351264954, -0.00011588633060455322, -0.00010667368769645691, -9.74610447883606e-05, -8.824840188026428e-05, -7.903575897216797e-05, -6.982311606407166e-05, -6.061047315597534e-05, -5.139783024787903e-05, -4.2185187339782715e-05, -3.29725444316864e-05, -2.3759901523590088e-05, -1.4547258615493774e-05, -5.334615707397461e-06, 3.8780272006988525e-06, 1.3090670108795166e-05, 2.230331301689148e-05, 3.151595592498779e-05, 4.0728598833084106e-05, 4.994124174118042e-05, 5.9153884649276733e-05, 6.836652755737305e-05, 7.757917046546936e-05, 8.679181337356567e-05, 9.600445628166199e-05, 0.0001052170991897583, 0.00011442974209785461, 0.00012364238500595093, 0.00013285502791404724, 0.00014206767082214355, 0.00015128031373023987, 0.00016049295663833618, 0.0001697055995464325, 0.0001789182424545288, 0.00018813088536262512, 0.00019734352827072144, 0.00020655617117881775, 0.00021576881408691406]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 19.0, 21.0, 31.0, 46.0, 55.0, 108.0, 128.0, 208.0, 323.0, 551.0, 890.0, 1621.0, 2719.0, 5220.0, 10366.0, 20769.0, 42923.0, 86481.0, 155435.0, 216951.0, 209614.0, 141067.0, 76597.0, 37926.0, 18241.0, 9227.0, 4803.0, 2515.0, 1421.0, 882.0, 485.0, 305.0, 206.0, 123.0, 81.0, 52.0, 46.0, 32.0, 18.0, 9.0, 9.0, 7.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.4001960754394531, -0.38681793212890625, -0.3734397888183594, -0.3600616455078125, -0.3466835021972656, -0.33330535888671875, -0.3199272155761719, -0.306549072265625, -0.2931709289550781, -0.27979278564453125, -0.2664146423339844, -0.2530364990234375, -0.23965835571289062, -0.22628021240234375, -0.21290206909179688, -0.19952392578125, -0.18614578247070312, -0.17276763916015625, -0.15938949584960938, -0.1460113525390625, -0.13263320922851562, -0.11925506591796875, -0.10587692260742188, -0.092498779296875, -0.07912063598632812, -0.06574249267578125, -0.052364349365234375, -0.0389862060546875, -0.025608062744140625, -0.01222991943359375, 0.001148223876953125, 0.0145263671875, 0.027904510498046875, 0.04128265380859375, 0.054660797119140625, 0.0680389404296875, 0.08141708374023438, 0.09479522705078125, 0.10817337036132812, 0.121551513671875, 0.13492965698242188, 0.14830780029296875, 0.16168594360351562, 0.1750640869140625, 0.18844223022460938, 0.20182037353515625, 0.21519851684570312, 0.22857666015625, 0.24195480346679688, 0.25533294677734375, 0.2687110900878906, 0.2820892333984375, 0.2954673767089844, 0.30884552001953125, 0.3222236633300781, 0.335601806640625, 0.3489799499511719, 0.36235809326171875, 0.3757362365722656, 0.3891143798828125, 0.4024925231933594, 0.41587066650390625, 0.4292488098144531, 0.442626953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 10.0, 8.0, 4.0, 9.0, 21.0, 29.0, 19.0, 29.0, 39.0, 48.0, 51.0, 51.0, 55.0, 64.0, 64.0, 70.0, 55.0, 57.0, 49.0, 39.0, 41.0, 24.0, 27.0, 24.0, 29.0, 15.0, 11.0, 8.0, 11.0, 8.0, 3.0, 2.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.372039794921875, -0.36029052734375, -0.348541259765625, -0.3367919921875, -0.325042724609375, -0.31329345703125, -0.301544189453125, -0.289794921875, -0.278045654296875, -0.26629638671875, -0.254547119140625, -0.2427978515625, -0.231048583984375, -0.21929931640625, -0.207550048828125, -0.19580078125, -0.184051513671875, -0.17230224609375, -0.160552978515625, -0.1488037109375, -0.137054443359375, -0.12530517578125, -0.113555908203125, -0.101806640625, -0.090057373046875, -0.07830810546875, -0.066558837890625, -0.0548095703125, -0.043060302734375, -0.03131103515625, -0.019561767578125, -0.0078125, 0.003936767578125, 0.01568603515625, 0.027435302734375, 0.0391845703125, 0.050933837890625, 0.06268310546875, 0.074432373046875, 0.086181640625, 0.097930908203125, 0.10968017578125, 0.121429443359375, 0.1331787109375, 0.144927978515625, 0.15667724609375, 0.168426513671875, 0.18017578125, 0.191925048828125, 0.20367431640625, 0.215423583984375, 0.2271728515625, 0.238922119140625, 0.25067138671875, 0.262420654296875, 0.274169921875, 0.285919189453125, 0.29766845703125, 0.309417724609375, 0.3211669921875, 0.332916259765625, 0.34466552734375, 0.356414794921875, 0.3681640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 11.0, 15.0, 20.0, 29.0, 36.0, 42.0, 54.0, 80.0, 98.0, 101.0, 88.0, 83.0, 74.0, 64.0, 49.0, 36.0, 30.0, 25.0, 20.0, 8.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.323822975158691, -5.1911516189575195, -5.058480262756348, -4.925808906555176, -4.793137550354004, -4.660466194152832, -4.52779483795166, -4.395123481750488, -4.262452125549316, -4.1297807693481445, -3.9971094131469727, -3.864438056945801, -3.731766700744629, -3.599095344543457, -3.466423749923706, -3.333752393722534, -3.201080799102783, -3.0684094429016113, -2.9357380867004395, -2.8030667304992676, -2.6703953742980957, -2.537724018096924, -2.405052423477173, -2.272381067276001, -2.139709711074829, -2.0070383548736572, -1.8743669986724854, -1.741695523262024, -1.609024167060852, -1.4763528108596802, -1.3436813354492188, -1.2110099792480469, -1.078338861465454, -0.9456675052642822, -0.8129960894584656, -0.6803246736526489, -0.547653317451477, -0.4149819612503052, -0.2823105454444885, -0.14963912963867188, -0.0169677734375, 0.11570361256599426, 0.24837499856948853, 0.3810463845729828, 0.513717770576477, 0.6463891267776489, 0.7790605425834656, 0.9117319583892822, 1.044403314590454, 1.177074670791626, 1.3097460269927979, 1.4424175024032593, 1.5750888586044312, 1.707760214805603, 1.8404316902160645, 1.9731030464172363, 2.105774402618408, 2.23844575881958, 2.371117115020752, 2.503788471221924, 2.6364598274230957, 2.7691311836242676, 2.9018027782440186, 3.0344741344451904, 3.1671454906463623]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 12.0, 5.0, 13.0, 17.0, 20.0, 21.0, 11.0, 31.0, 29.0, 34.0, 30.0, 41.0, 46.0, 35.0, 40.0, 50.0, 47.0, 52.0, 55.0, 52.0, 58.0, 41.0, 28.0, 31.0, 54.0, 33.0, 17.0, 23.0, 15.0, 9.0, 9.0, 6.0, 12.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3858189582824707, -3.2768642902374268, -3.167909860610962, -3.058955192565918, -2.950000762939453, -2.841046094894409, -2.7320914268493652, -2.6231369972229004, -2.5141823291778564, -2.4052276611328125, -2.2962732315063477, -2.1873185634613037, -2.078364133834839, -1.969409465789795, -1.8604549169540405, -1.7515003681182861, -1.6425458192825317, -1.5335912704467773, -1.424636721611023, -1.3156821727752686, -1.2067275047302246, -1.0977729558944702, -0.9888184070587158, -0.8798637986183167, -0.7709092497825623, -0.6619547009468079, -0.5530000925064087, -0.4440455436706543, -0.3350909650325775, -0.22613638639450073, -0.11718183755874634, -0.008227229118347168, 0.10072731971740723, 0.209681898355484, 0.3186364769935608, 0.4275910258293152, 0.5365456342697144, 0.6455001831054688, 0.7544547319412231, 0.8634093403816223, 0.9723638892173767, 1.0813184976577759, 1.1902730464935303, 1.2992275953292847, 1.408182144165039, 1.517136812210083, 1.6260912418365479, 1.7350459098815918, 1.8440004587173462, 1.9529550075531006, 2.0619096755981445, 2.1708641052246094, 2.2798187732696533, 2.3887734413146973, 2.497727870941162, 2.606682538986206, 2.715636968612671, 2.824591636657715, 2.9335460662841797, 3.0425007343292236, 3.1514551639556885, 3.2604098320007324, 3.3693642616271973, 3.478318929672241, 3.587273597717285]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 17.0, 21.0, 45.0, 74.0, 90.0, 163.0, 395.0, 1362.0, 11133.0, 253314.0, 3607779.0, 305916.0, 11853.0, 1364.0, 357.0, 136.0, 79.0, 56.0, 35.0, 21.0, 19.0, 11.0, 10.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.2151336669921875, -2.150970458984375, -2.0868072509765625, -2.02264404296875, -1.9584808349609375, -1.894317626953125, -1.8301544189453125, -1.7659912109375, -1.7018280029296875, -1.637664794921875, -1.5735015869140625, -1.50933837890625, -1.4451751708984375, -1.381011962890625, -1.3168487548828125, -1.252685546875, -1.1885223388671875, -1.124359130859375, -1.0601959228515625, -0.99603271484375, -0.9318695068359375, -0.867706298828125, -0.8035430908203125, -0.7393798828125, -0.6752166748046875, -0.611053466796875, -0.5468902587890625, -0.48272705078125, -0.4185638427734375, -0.354400634765625, -0.2902374267578125, -0.22607421875, -0.1619110107421875, -0.097747802734375, -0.0335845947265625, 0.03057861328125, 0.0947418212890625, 0.158905029296875, 0.2230682373046875, 0.2872314453125, 0.3513946533203125, 0.415557861328125, 0.4797210693359375, 0.54388427734375, 0.6080474853515625, 0.672210693359375, 0.7363739013671875, 0.800537109375, 0.8647003173828125, 0.928863525390625, 0.9930267333984375, 1.05718994140625, 1.1213531494140625, 1.185516357421875, 1.2496795654296875, 1.3138427734375, 1.3780059814453125, 1.442169189453125, 1.5063323974609375, 1.57049560546875, 1.6346588134765625, 1.698822021484375, 1.7629852294921875, 1.8271484375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 8.0, 8.0, 12.0, 16.0, 15.0, 19.0, 23.0, 23.0, 29.0, 27.0, 46.0, 46.0, 43.0, 64.0, 55.0, 51.0, 56.0, 76.0, 49.0, 44.0, 48.0, 42.0, 27.0, 38.0, 28.0, 25.0, 19.0, 14.0, 12.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.51318359375, -0.4976463317871094, -0.48210906982421875, -0.4665718078613281, -0.4510345458984375, -0.4354972839355469, -0.41996002197265625, -0.4044227600097656, -0.388885498046875, -0.3733482360839844, -0.35781097412109375, -0.3422737121582031, -0.3267364501953125, -0.3111991882324219, -0.29566192626953125, -0.2801246643066406, -0.26458740234375, -0.24905014038085938, -0.23351287841796875, -0.21797561645507812, -0.2024383544921875, -0.18690109252929688, -0.17136383056640625, -0.15582656860351562, -0.140289306640625, -0.12475204467773438, -0.10921478271484375, -0.09367752075195312, -0.0781402587890625, -0.06260299682617188, -0.04706573486328125, -0.031528472900390625, -0.0159912109375, -0.000453948974609375, 0.01508331298828125, 0.030620574951171875, 0.0461578369140625, 0.061695098876953125, 0.07723236083984375, 0.09276962280273438, 0.108306884765625, 0.12384414672851562, 0.13938140869140625, 0.15491867065429688, 0.1704559326171875, 0.18599319458007812, 0.20153045654296875, 0.21706771850585938, 0.23260498046875, 0.24814224243164062, 0.26367950439453125, 0.2792167663574219, 0.2947540283203125, 0.3102912902832031, 0.32582855224609375, 0.3413658142089844, 0.356903076171875, 0.3724403381347656, 0.38797760009765625, 0.4035148620605469, 0.4190521240234375, 0.4345893859863281, 0.45012664794921875, 0.4656639099121094, 0.481201171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 13.0, 5.0, 12.0, 24.0, 28.0, 46.0, 90.0, 118.0, 246.0, 506.0, 967.0, 2353.0, 7023.0, 28116.0, 137330.0, 737686.0, 2113079.0, 940464.0, 177502.0, 34880.0, 8717.0, 2759.0, 1118.0, 534.0, 284.0, 156.0, 69.0, 57.0, 27.0, 29.0, 21.0, 7.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.421875, -1.3868331909179688, -1.3517913818359375, -1.3167495727539062, -1.281707763671875, -1.2466659545898438, -1.2116241455078125, -1.1765823364257812, -1.14154052734375, -1.1064987182617188, -1.0714569091796875, -1.0364151000976562, -1.001373291015625, -0.9663314819335938, -0.9312896728515625, -0.8962478637695312, -0.8612060546875, -0.8261642456054688, -0.7911224365234375, -0.7560806274414062, -0.721038818359375, -0.6859970092773438, -0.6509552001953125, -0.6159133911132812, -0.58087158203125, -0.5458297729492188, -0.5107879638671875, -0.47574615478515625, -0.440704345703125, -0.40566253662109375, -0.3706207275390625, -0.33557891845703125, -0.300537109375, -0.26549530029296875, -0.2304534912109375, -0.19541168212890625, -0.160369873046875, -0.12532806396484375, -0.0902862548828125, -0.05524444580078125, -0.02020263671875, 0.01483917236328125, 0.0498809814453125, 0.08492279052734375, 0.119964599609375, 0.15500640869140625, 0.1900482177734375, 0.22509002685546875, 0.2601318359375, 0.29517364501953125, 0.3302154541015625, 0.36525726318359375, 0.400299072265625, 0.43534088134765625, 0.4703826904296875, 0.5054244995117188, 0.54046630859375, 0.5755081176757812, 0.6105499267578125, 0.6455917358398438, 0.680633544921875, 0.7156753540039062, 0.7507171630859375, 0.7857589721679688, 0.82080078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 9.0, 8.0, 18.0, 15.0, 38.0, 35.0, 55.0, 73.0, 99.0, 159.0, 198.0, 239.0, 283.0, 332.0, 355.0, 397.0, 359.0, 321.0, 261.0, 228.0, 151.0, 128.0, 81.0, 71.0, 39.0, 28.0, 31.0, 20.0, 18.0, 6.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61962890625, -0.596099853515625, -0.57257080078125, -0.549041748046875, -0.5255126953125, -0.501983642578125, -0.47845458984375, -0.454925537109375, -0.431396484375, -0.407867431640625, -0.38433837890625, -0.360809326171875, -0.3372802734375, -0.313751220703125, -0.29022216796875, -0.266693115234375, -0.2431640625, -0.219635009765625, -0.19610595703125, -0.172576904296875, -0.1490478515625, -0.125518798828125, -0.10198974609375, -0.078460693359375, -0.054931640625, -0.031402587890625, -0.00787353515625, 0.015655517578125, 0.0391845703125, 0.062713623046875, 0.08624267578125, 0.109771728515625, 0.13330078125, 0.156829833984375, 0.18035888671875, 0.203887939453125, 0.2274169921875, 0.250946044921875, 0.27447509765625, 0.298004150390625, 0.321533203125, 0.345062255859375, 0.36859130859375, 0.392120361328125, 0.4156494140625, 0.439178466796875, 0.46270751953125, 0.486236572265625, 0.509765625, 0.533294677734375, 0.55682373046875, 0.580352783203125, 0.6038818359375, 0.627410888671875, 0.65093994140625, 0.674468994140625, 0.697998046875, 0.721527099609375, 0.74505615234375, 0.768585205078125, 0.7921142578125, 0.815643310546875, 0.83917236328125, 0.862701416015625, 0.88623046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 25.0, 49.0, 116.0, 221.0, 258.0, 200.0, 84.0, 34.0, 12.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.779558181762695, -6.461991310119629, -6.1444244384765625, -5.826857566833496, -5.509291172027588, -5.1917243003845215, -4.874157428741455, -4.556591033935547, -4.2390241622924805, -3.921457290649414, -3.6038906574249268, -3.2863237857818604, -2.968757152557373, -2.6511902809143066, -2.3336234092712402, -2.016056776046753, -1.6984896659851074, -1.3809229135513306, -1.0633561611175537, -0.7457892894744873, -0.42822253704071045, -0.1106557846069336, 0.2069110870361328, 0.5244777202606201, 0.8420445919036865, 1.1596113443374634, 1.4771780967712402, 1.7947449684143066, 2.112311840057373, 2.4298784732818604, 2.7474453449249268, 3.065011978149414, 3.3825788497924805, 3.700145721435547, 4.017712593078613, 4.33527946472168, 4.652845859527588, 4.970412731170654, 5.287979602813721, 5.605545997619629, 5.923112869262695, 6.240679740905762, 6.558246612548828, 6.8758134841918945, 7.193379878997803, 7.510946750640869, 7.8285136222839355, 8.146080017089844, 8.463647842407227, 8.781214714050293, 9.09878158569336, 9.416348457336426, 9.733915328979492, 10.051481246948242, 10.369049072265625, 10.686614990234375, 11.004181861877441, 11.321748733520508, 11.639315605163574, 11.95688247680664, 12.274449348449707, 12.592016220092773, 12.909582138061523, 13.22714900970459, 13.544715881347656]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 9.0, 12.0, 14.0, 14.0, 18.0, 21.0, 28.0, 28.0, 29.0, 34.0, 41.0, 35.0, 38.0, 65.0, 43.0, 47.0, 52.0, 48.0, 45.0, 47.0, 42.0, 35.0, 25.0, 30.0, 22.0, 29.0, 23.0, 21.0, 15.0, 16.0, 16.0, 6.0, 10.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5316033363342285, -2.4514083862304688, -2.371213436126709, -2.29101824760437, -2.2108232975006104, -2.1306283473968506, -2.050433397293091, -1.9702383279800415, -1.8900432586669922, -1.8098483085632324, -1.729653239250183, -1.6494582891464233, -1.569263219833374, -1.4890682697296143, -1.4088733196258545, -1.3286782503128052, -1.2484833002090454, -1.1682883501052856, -1.0880932807922363, -1.0078983306884766, -0.9277032613754272, -0.8475083112716675, -0.7673133015632629, -0.6871182918548584, -0.6069232821464539, -0.5267282724380493, -0.4465332627296448, -0.3663382828235626, -0.2861432731151581, -0.20594826340675354, -0.1257532835006714, -0.045558273792266846, 0.034636735916137695, 0.11483173817396164, 0.19502674043178558, 0.27522173523902893, 0.35541674494743347, 0.435611754655838, 0.5158067345619202, 0.5960017442703247, 0.6761967539787292, 0.7563917636871338, 0.8365867733955383, 0.9167817831039429, 0.9969767332077026, 1.077171802520752, 1.1573667526245117, 1.2375617027282715, 1.3177567720413208, 1.3979517221450806, 1.4781467914581299, 1.5583417415618896, 1.638536810874939, 1.7187317609786987, 1.798926830291748, 1.8791217803955078, 1.9593167304992676, 2.0395116806030273, 2.119706630706787, 2.199901819229126, 2.2800967693328857, 2.3602917194366455, 2.4404866695404053, 2.520681858062744, 2.600876808166504]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 8.0, 12.0, 15.0, 19.0, 42.0, 58.0, 114.0, 269.0, 558.0, 1111.0, 2569.0, 6361.0, 15645.0, 45621.0, 159862.0, 393199.0, 290149.0, 88282.0, 27079.0, 10097.0, 4143.0, 1754.0, 770.0, 363.0, 160.0, 88.0, 59.0, 34.0, 25.0, 13.0, 13.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7685546875, -1.7110748291015625, -1.653594970703125, -1.5961151123046875, -1.53863525390625, -1.4811553955078125, -1.423675537109375, -1.3661956787109375, -1.3087158203125, -1.2512359619140625, -1.193756103515625, -1.1362762451171875, -1.07879638671875, -1.0213165283203125, -0.963836669921875, -0.9063568115234375, -0.848876953125, -0.7913970947265625, -0.733917236328125, -0.6764373779296875, -0.61895751953125, -0.5614776611328125, -0.503997802734375, -0.4465179443359375, -0.3890380859375, -0.3315582275390625, -0.274078369140625, -0.2165985107421875, -0.15911865234375, -0.1016387939453125, -0.044158935546875, 0.0133209228515625, 0.07080078125, 0.1282806396484375, 0.185760498046875, 0.2432403564453125, 0.30072021484375, 0.3582000732421875, 0.415679931640625, 0.4731597900390625, 0.5306396484375, 0.5881195068359375, 0.645599365234375, 0.7030792236328125, 0.76055908203125, 0.8180389404296875, 0.875518798828125, 0.9329986572265625, 0.990478515625, 1.0479583740234375, 1.105438232421875, 1.1629180908203125, 1.22039794921875, 1.2778778076171875, 1.335357666015625, 1.3928375244140625, 1.4503173828125, 1.5077972412109375, 1.565277099609375, 1.6227569580078125, 1.68023681640625, 1.7377166748046875, 1.795196533203125, 1.8526763916015625, 1.91015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 13.0, 13.0, 19.0, 18.0, 26.0, 38.0, 46.0, 42.0, 56.0, 73.0, 55.0, 68.0, 79.0, 84.0, 75.0, 61.0, 47.0, 42.0, 37.0, 34.0, 20.0, 15.0, 10.0, 10.0, 7.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7109375, -0.6917800903320312, -0.6726226806640625, -0.6534652709960938, -0.634307861328125, -0.6151504516601562, -0.5959930419921875, -0.5768356323242188, -0.55767822265625, -0.5385208129882812, -0.5193634033203125, -0.5002059936523438, -0.481048583984375, -0.46189117431640625, -0.4427337646484375, -0.42357635498046875, -0.4044189453125, -0.38526153564453125, -0.3661041259765625, -0.34694671630859375, -0.327789306640625, -0.30863189697265625, -0.2894744873046875, -0.27031707763671875, -0.25115966796875, -0.23200225830078125, -0.2128448486328125, -0.19368743896484375, -0.174530029296875, -0.15537261962890625, -0.1362152099609375, -0.11705780029296875, -0.097900390625, -0.07874298095703125, -0.0595855712890625, -0.04042816162109375, -0.021270751953125, -0.00211334228515625, 0.0170440673828125, 0.03620147705078125, 0.05535888671875, 0.07451629638671875, 0.0936737060546875, 0.11283111572265625, 0.131988525390625, 0.15114593505859375, 0.1703033447265625, 0.18946075439453125, 0.2086181640625, 0.22777557373046875, 0.2469329833984375, 0.26609039306640625, 0.285247802734375, 0.30440521240234375, 0.3235626220703125, 0.34272003173828125, 0.36187744140625, 0.38103485107421875, 0.4001922607421875, 0.41934967041015625, 0.438507080078125, 0.45766448974609375, 0.4768218994140625, 0.49597930908203125, 0.51513671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 10.0, 16.0, 21.0, 24.0, 46.0, 71.0, 98.0, 111.0, 181.0, 277.0, 457.0, 808.0, 1397.0, 2646.0, 4919.0, 9654.0, 19627.0, 39174.0, 80513.0, 149826.0, 219867.0, 218039.0, 146309.0, 77597.0, 37982.0, 18739.0, 9240.0, 4869.0, 2573.0, 1361.0, 746.0, 451.0, 299.0, 188.0, 127.0, 95.0, 54.0, 42.0, 29.0, 26.0, 13.0, 14.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.95654296875, -0.9266281127929688, -0.8967132568359375, -0.8667984008789062, -0.836883544921875, -0.8069686889648438, -0.7770538330078125, -0.7471389770507812, -0.71722412109375, -0.6873092651367188, -0.6573944091796875, -0.6274795532226562, -0.597564697265625, -0.5676498413085938, -0.5377349853515625, -0.5078201293945312, -0.4779052734375, -0.44799041748046875, -0.4180755615234375, -0.38816070556640625, -0.358245849609375, -0.32833099365234375, -0.2984161376953125, -0.26850128173828125, -0.23858642578125, -0.20867156982421875, -0.1787567138671875, -0.14884185791015625, -0.118927001953125, -0.08901214599609375, -0.0590972900390625, -0.02918243408203125, 0.000732421875, 0.03064727783203125, 0.0605621337890625, 0.09047698974609375, 0.120391845703125, 0.15030670166015625, 0.1802215576171875, 0.21013641357421875, 0.24005126953125, 0.26996612548828125, 0.2998809814453125, 0.32979583740234375, 0.359710693359375, 0.38962554931640625, 0.4195404052734375, 0.44945526123046875, 0.4793701171875, 0.5092849731445312, 0.5391998291015625, 0.5691146850585938, 0.599029541015625, 0.6289443969726562, 0.6588592529296875, 0.6887741088867188, 0.71868896484375, 0.7486038208007812, 0.7785186767578125, 0.8084335327148438, 0.838348388671875, 0.8682632446289062, 0.8981781005859375, 0.9280929565429688, 0.9580078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 7.0, 14.0, 14.0, 15.0, 21.0, 27.0, 25.0, 31.0, 36.0, 32.0, 35.0, 49.0, 41.0, 49.0, 50.0, 40.0, 42.0, 32.0, 45.0, 45.0, 41.0, 34.0, 35.0, 42.0, 28.0, 34.0, 16.0, 21.0, 16.0, 16.0, 8.0, 10.0, 4.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1123046875, -1.0794906616210938, -1.0466766357421875, -1.0138626098632812, -0.981048583984375, -0.9482345581054688, -0.9154205322265625, -0.8826065063476562, -0.84979248046875, -0.8169784545898438, -0.7841644287109375, -0.7513504028320312, -0.718536376953125, -0.6857223510742188, -0.6529083251953125, -0.6200942993164062, -0.5872802734375, -0.5544662475585938, -0.5216522216796875, -0.48883819580078125, -0.456024169921875, -0.42321014404296875, -0.3903961181640625, -0.35758209228515625, -0.32476806640625, -0.29195404052734375, -0.2591400146484375, -0.22632598876953125, -0.193511962890625, -0.16069793701171875, -0.1278839111328125, -0.09506988525390625, -0.062255859375, -0.02944183349609375, 0.0033721923828125, 0.03618621826171875, 0.069000244140625, 0.10181427001953125, 0.1346282958984375, 0.16744232177734375, 0.20025634765625, 0.23307037353515625, 0.2658843994140625, 0.29869842529296875, 0.331512451171875, 0.36432647705078125, 0.3971405029296875, 0.42995452880859375, 0.4627685546875, 0.49558258056640625, 0.5283966064453125, 0.5612106323242188, 0.594024658203125, 0.6268386840820312, 0.6596527099609375, 0.6924667358398438, 0.72528076171875, 0.7580947875976562, 0.7909088134765625, 0.8237228393554688, 0.856536865234375, 0.8893508911132812, 0.9221649169921875, 0.9549789428710938, 0.98779296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 13.0, 23.0, 35.0, 55.0, 101.0, 172.0, 339.0, 553.0, 1076.0, 1974.0, 4392.0, 10150.0, 24976.0, 64860.0, 152992.0, 268912.0, 265493.0, 148350.0, 61739.0, 24286.0, 9710.0, 4131.0, 1966.0, 958.0, 529.0, 340.0, 159.0, 135.0, 39.0, 37.0, 17.0, 11.0, 13.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48095703125, -0.46543121337890625, -0.4499053955078125, -0.43437957763671875, -0.418853759765625, -0.40332794189453125, -0.3878021240234375, -0.37227630615234375, -0.35675048828125, -0.34122467041015625, -0.3256988525390625, -0.31017303466796875, -0.294647216796875, -0.27912139892578125, -0.2635955810546875, -0.24806976318359375, -0.2325439453125, -0.21701812744140625, -0.2014923095703125, -0.18596649169921875, -0.170440673828125, -0.15491485595703125, -0.1393890380859375, -0.12386322021484375, -0.10833740234375, -0.09281158447265625, -0.0772857666015625, -0.06175994873046875, -0.046234130859375, -0.03070831298828125, -0.0151824951171875, 0.00034332275390625, 0.015869140625, 0.03139495849609375, 0.0469207763671875, 0.06244659423828125, 0.077972412109375, 0.09349822998046875, 0.1090240478515625, 0.12454986572265625, 0.14007568359375, 0.15560150146484375, 0.1711273193359375, 0.18665313720703125, 0.202178955078125, 0.21770477294921875, 0.2332305908203125, 0.24875640869140625, 0.2642822265625, 0.27980804443359375, 0.2953338623046875, 0.31085968017578125, 0.326385498046875, 0.34191131591796875, 0.3574371337890625, 0.37296295166015625, 0.38848876953125, 0.40401458740234375, 0.4195404052734375, 0.43506622314453125, 0.450592041015625, 0.46611785888671875, 0.4816436767578125, 0.49716949462890625, 0.5126953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 9.0, 10.0, 6.0, 18.0, 13.0, 17.0, 34.0, 33.0, 47.0, 55.0, 49.0, 71.0, 61.0, 76.0, 80.0, 66.0, 65.0, 51.0, 42.0, 45.0, 21.0, 23.0, 18.0, 15.0, 9.0, 15.0, 6.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.381981074810028e-05, -6.153807044029236e-05, -5.9256330132484436e-05, -5.6974589824676514e-05, -5.469284951686859e-05, -5.241110920906067e-05, -5.0129368901252747e-05, -4.7847628593444824e-05, -4.55658882856369e-05, -4.328414797782898e-05, -4.100240767002106e-05, -3.8720667362213135e-05, -3.643892705440521e-05, -3.415718674659729e-05, -3.187544643878937e-05, -2.9593706130981445e-05, -2.7311965823173523e-05, -2.50302255153656e-05, -2.2748485207557678e-05, -2.0466744899749756e-05, -1.8185004591941833e-05, -1.590326428413391e-05, -1.3621523976325989e-05, -1.1339783668518066e-05, -9.058043360710144e-06, -6.776303052902222e-06, -4.494562745094299e-06, -2.212822437286377e-06, 6.891787052154541e-08, 2.3506581783294678e-06, 4.63239848613739e-06, 6.9141387939453125e-06, 9.195879101753235e-06, 1.1477619409561157e-05, 1.375935971736908e-05, 1.6041100025177002e-05, 1.8322840332984924e-05, 2.0604580640792847e-05, 2.288632094860077e-05, 2.516806125640869e-05, 2.7449801564216614e-05, 2.9731541872024536e-05, 3.201328217983246e-05, 3.429502248764038e-05, 3.65767627954483e-05, 3.8858503103256226e-05, 4.114024341106415e-05, 4.342198371887207e-05, 4.570372402667999e-05, 4.7985464334487915e-05, 5.026720464229584e-05, 5.254894495010376e-05, 5.483068525791168e-05, 5.7112425565719604e-05, 5.939416587352753e-05, 6.167590618133545e-05, 6.395764648914337e-05, 6.62393867969513e-05, 6.852112710475922e-05, 7.080286741256714e-05, 7.308460772037506e-05, 7.536634802818298e-05, 7.76480883359909e-05, 7.992982864379883e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 8.0, 13.0, 15.0, 30.0, 47.0, 54.0, 104.0, 172.0, 250.0, 444.0, 843.0, 1565.0, 3311.0, 7474.0, 17089.0, 40477.0, 94874.0, 191147.0, 265943.0, 217833.0, 116078.0, 51725.0, 21600.0, 9322.0, 4061.0, 1832.0, 974.0, 504.0, 307.0, 172.0, 108.0, 58.0, 47.0, 29.0, 20.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.5, -0.4867134094238281, -0.47342681884765625, -0.4601402282714844, -0.4468536376953125, -0.4335670471191406, -0.42028045654296875, -0.4069938659667969, -0.393707275390625, -0.3804206848144531, -0.36713409423828125, -0.3538475036621094, -0.3405609130859375, -0.3272743225097656, -0.31398773193359375, -0.3007011413574219, -0.28741455078125, -0.2741279602050781, -0.26084136962890625, -0.24755477905273438, -0.2342681884765625, -0.22098159790039062, -0.20769500732421875, -0.19440841674804688, -0.181121826171875, -0.16783523559570312, -0.15454864501953125, -0.14126205444335938, -0.1279754638671875, -0.11468887329101562, -0.10140228271484375, -0.08811569213867188, -0.0748291015625, -0.061542510986328125, -0.04825592041015625, -0.034969329833984375, -0.0216827392578125, -0.008396148681640625, 0.00489044189453125, 0.018177032470703125, 0.031463623046875, 0.044750213623046875, 0.05803680419921875, 0.07132339477539062, 0.0846099853515625, 0.09789657592773438, 0.11118316650390625, 0.12446975708007812, 0.13775634765625, 0.15104293823242188, 0.16432952880859375, 0.17761611938476562, 0.1909027099609375, 0.20418930053710938, 0.21747589111328125, 0.23076248168945312, 0.244049072265625, 0.2573356628417969, 0.27062225341796875, 0.2839088439941406, 0.2971954345703125, 0.3104820251464844, 0.32376861572265625, 0.3370552062988281, 0.350341796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 10.0, 10.0, 8.0, 14.0, 13.0, 16.0, 23.0, 24.0, 37.0, 38.0, 41.0, 44.0, 48.0, 61.0, 64.0, 81.0, 56.0, 59.0, 47.0, 38.0, 36.0, 36.0, 25.0, 24.0, 29.0, 21.0, 23.0, 16.0, 15.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3105010986328125, -0.299957275390625, -0.2894134521484375, -0.27886962890625, -0.2683258056640625, -0.257781982421875, -0.2472381591796875, -0.2366943359375, -0.2261505126953125, -0.215606689453125, -0.2050628662109375, -0.19451904296875, -0.1839752197265625, -0.173431396484375, -0.1628875732421875, -0.15234375, -0.1417999267578125, -0.131256103515625, -0.1207122802734375, -0.11016845703125, -0.0996246337890625, -0.089080810546875, -0.0785369873046875, -0.0679931640625, -0.0574493408203125, -0.046905517578125, -0.0363616943359375, -0.02581787109375, -0.0152740478515625, -0.004730224609375, 0.0058135986328125, 0.016357421875, 0.0269012451171875, 0.037445068359375, 0.0479888916015625, 0.05853271484375, 0.0690765380859375, 0.079620361328125, 0.0901641845703125, 0.1007080078125, 0.1112518310546875, 0.121795654296875, 0.1323394775390625, 0.14288330078125, 0.1534271240234375, 0.163970947265625, 0.1745147705078125, 0.18505859375, 0.1956024169921875, 0.206146240234375, 0.2166900634765625, 0.22723388671875, 0.2377777099609375, 0.248321533203125, 0.2588653564453125, 0.2694091796875, 0.2799530029296875, 0.290496826171875, 0.3010406494140625, 0.31158447265625, 0.3221282958984375, 0.332672119140625, 0.3432159423828125, 0.353759765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 11.0, 11.0, 21.0, 32.0, 32.0, 49.0, 45.0, 59.0, 67.0, 80.0, 83.0, 78.0, 69.0, 61.0, 54.0, 45.0, 53.0, 35.0, 25.0, 19.0, 16.0, 11.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62399959564209, -2.5225133895874023, -2.4210269451141357, -2.3195407390594482, -2.2180545330047607, -2.116568088531494, -2.0150818824768066, -1.9135956764221191, -1.812109351158142, -1.710623025894165, -1.6091368198394775, -1.5076504945755005, -1.4061641693115234, -1.304677963256836, -1.2031916379928589, -1.1017053127288818, -1.0002191066741943, -0.8987328410148621, -0.7972465753555298, -0.6957602500915527, -0.5942739844322205, -0.4927877187728882, -0.39130139350891113, -0.28981512784957886, -0.18832886219024658, -0.08684258162975311, 0.014643698930740356, 0.11612999439239502, 0.2176162600517273, 0.31910252571105957, 0.4205888509750366, 0.5220751166343689, 0.6235613822937012, 0.7250476479530334, 0.8265339136123657, 0.9280202388763428, 1.0295064449310303, 1.1309927701950073, 1.2324790954589844, 1.3339653015136719, 1.435451626777649, 1.536937952041626, 1.6384241580963135, 1.7399104833602905, 1.8413968086242676, 1.942883014678955, 2.0443692207336426, 2.145855665206909, 2.2473418712615967, 2.348828077316284, 2.450314521789551, 2.5518007278442383, 2.653286933898926, 2.7547731399536133, 2.85625958442688, 2.9577457904815674, 3.059232234954834, 3.1607184410095215, 3.262204885482788, 3.3636910915374756, 3.465177297592163, 3.5666637420654297, 3.668149948120117, 3.7696361541748047, 3.871122360229492]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 11.0, 5.0, 12.0, 11.0, 10.0, 19.0, 21.0, 16.0, 31.0, 29.0, 28.0, 47.0, 32.0, 47.0, 36.0, 39.0, 32.0, 37.0, 49.0, 31.0, 46.0, 38.0, 47.0, 42.0, 35.0, 26.0, 22.0, 27.0, 26.0, 29.0, 20.0, 7.0, 12.0, 11.0, 11.0, 9.0, 3.0, 6.0, 7.0, 4.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.8946542739868164, -2.8066117763519287, -2.718569278717041, -2.6305267810821533, -2.5424842834472656, -2.454441785812378, -2.3663992881774902, -2.2783567905426025, -2.190314292907715, -2.102271795272827, -2.0142292976379395, -1.9261868000030518, -1.838144302368164, -1.7501018047332764, -1.6620593070983887, -1.574016809463501, -1.4859743118286133, -1.3979318141937256, -1.309889316558838, -1.2218468189239502, -1.1338043212890625, -1.0457618236541748, -0.9577193260192871, -0.8696768283843994, -0.7816343307495117, -0.693591833114624, -0.6055493354797363, -0.5175068378448486, -0.42946434020996094, -0.34142184257507324, -0.25337934494018555, -0.16533684730529785, -0.07729458808898926, 0.010747909545898438, 0.09879040718078613, 0.18683290481567383, 0.2748754024505615, 0.3629179000854492, 0.4509603977203369, 0.5390028953552246, 0.6270453929901123, 0.715087890625, 0.8031303882598877, 0.8911728858947754, 0.9792153835296631, 1.0672578811645508, 1.1553003787994385, 1.2433428764343262, 1.3313853740692139, 1.4194278717041016, 1.5074703693389893, 1.595512866973877, 1.6835553646087646, 1.7715978622436523, 1.85964035987854, 1.9476828575134277, 2.0357253551483154, 2.123767852783203, 2.211810350418091, 2.2998528480529785, 2.387895345687866, 2.475937843322754, 2.5639803409576416, 2.6520228385925293, 2.740065336227417]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 13.0, 15.0, 29.0, 19.0, 28.0, 52.0, 76.0, 157.0, 222.0, 408.0, 801.0, 1682.0, 4080.0, 10821.0, 32494.0, 113935.0, 498345.0, 1829978.0, 1307707.0, 286802.0, 71437.0, 21689.0, 7678.0, 3004.0, 1344.0, 655.0, 328.0, 188.0, 104.0, 63.0, 42.0, 23.0, 18.0, 8.0, 7.0, 6.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.9017791748046875, -0.877288818359375, -0.8527984619140625, -0.82830810546875, -0.8038177490234375, -0.779327392578125, -0.7548370361328125, -0.7303466796875, -0.7058563232421875, -0.681365966796875, -0.6568756103515625, -0.63238525390625, -0.6078948974609375, -0.583404541015625, -0.5589141845703125, -0.534423828125, -0.5099334716796875, -0.485443115234375, -0.4609527587890625, -0.43646240234375, -0.4119720458984375, -0.387481689453125, -0.3629913330078125, -0.3385009765625, -0.3140106201171875, -0.289520263671875, -0.2650299072265625, -0.24053955078125, -0.2160491943359375, -0.191558837890625, -0.1670684814453125, -0.142578125, -0.1180877685546875, -0.093597412109375, -0.0691070556640625, -0.04461669921875, -0.0201263427734375, 0.004364013671875, 0.0288543701171875, 0.0533447265625, 0.0778350830078125, 0.102325439453125, 0.1268157958984375, 0.15130615234375, 0.1757965087890625, 0.200286865234375, 0.2247772216796875, 0.249267578125, 0.2737579345703125, 0.298248291015625, 0.3227386474609375, 0.34722900390625, 0.3717193603515625, 0.396209716796875, 0.4207000732421875, 0.4451904296875, 0.4696807861328125, 0.494171142578125, 0.5186614990234375, 0.54315185546875, 0.5676422119140625, 0.592132568359375, 0.6166229248046875, 0.64111328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 14.0, 12.0, 24.0, 24.0, 22.0, 26.0, 25.0, 32.0, 49.0, 43.0, 63.0, 67.0, 53.0, 53.0, 56.0, 60.0, 57.0, 48.0, 44.0, 37.0, 39.0, 38.0, 27.0, 16.0, 17.0, 11.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55078125, -0.5349044799804688, -0.5190277099609375, -0.5031509399414062, -0.487274169921875, -0.47139739990234375, -0.4555206298828125, -0.43964385986328125, -0.42376708984375, -0.40789031982421875, -0.3920135498046875, -0.37613677978515625, -0.360260009765625, -0.34438323974609375, -0.3285064697265625, -0.31262969970703125, -0.2967529296875, -0.28087615966796875, -0.2649993896484375, -0.24912261962890625, -0.233245849609375, -0.21736907958984375, -0.2014923095703125, -0.18561553955078125, -0.16973876953125, -0.15386199951171875, -0.1379852294921875, -0.12210845947265625, -0.106231689453125, -0.09035491943359375, -0.0744781494140625, -0.05860137939453125, -0.042724609375, -0.02684783935546875, -0.0109710693359375, 0.00490570068359375, 0.020782470703125, 0.03665924072265625, 0.0525360107421875, 0.06841278076171875, 0.08428955078125, 0.10016632080078125, 0.1160430908203125, 0.13191986083984375, 0.147796630859375, 0.16367340087890625, 0.1795501708984375, 0.19542694091796875, 0.2113037109375, 0.22718048095703125, 0.2430572509765625, 0.25893402099609375, 0.274810791015625, 0.29068756103515625, 0.3065643310546875, 0.32244110107421875, 0.33831787109375, 0.35419464111328125, 0.3700714111328125, 0.38594818115234375, 0.401824951171875, 0.41770172119140625, 0.4335784912109375, 0.44945526123046875, 0.46533203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 11.0, 30.0, 39.0, 68.0, 86.0, 157.0, 322.0, 719.0, 2073.0, 8033.0, 39754.0, 265349.0, 1743912.0, 1802255.0, 277872.0, 41617.0, 8178.0, 2206.0, 803.0, 311.0, 151.0, 100.0, 72.0, 42.0, 33.0, 11.0, 15.0, 6.0, 10.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.291015625, -1.2506866455078125, -1.210357666015625, -1.1700286865234375, -1.12969970703125, -1.0893707275390625, -1.049041748046875, -1.0087127685546875, -0.9683837890625, -0.9280548095703125, -0.887725830078125, -0.8473968505859375, -0.80706787109375, -0.7667388916015625, -0.726409912109375, -0.6860809326171875, -0.645751953125, -0.6054229736328125, -0.565093994140625, -0.5247650146484375, -0.48443603515625, -0.4441070556640625, -0.403778076171875, -0.3634490966796875, -0.3231201171875, -0.2827911376953125, -0.242462158203125, -0.2021331787109375, -0.16180419921875, -0.1214752197265625, -0.081146240234375, -0.0408172607421875, -0.00048828125, 0.0398406982421875, 0.080169677734375, 0.1204986572265625, 0.16082763671875, 0.2011566162109375, 0.241485595703125, 0.2818145751953125, 0.3221435546875, 0.3624725341796875, 0.402801513671875, 0.4431304931640625, 0.48345947265625, 0.5237884521484375, 0.564117431640625, 0.6044464111328125, 0.644775390625, 0.6851043701171875, 0.725433349609375, 0.7657623291015625, 0.80609130859375, 0.8464202880859375, 0.886749267578125, 0.9270782470703125, 0.9674072265625, 1.0077362060546875, 1.048065185546875, 1.0883941650390625, 1.12872314453125, 1.1690521240234375, 1.209381103515625, 1.2497100830078125, 1.2900390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 10.0, 11.0, 9.0, 22.0, 28.0, 44.0, 49.0, 59.0, 86.0, 92.0, 118.0, 148.0, 162.0, 243.0, 300.0, 313.0, 378.0, 335.0, 294.0, 291.0, 263.0, 201.0, 139.0, 114.0, 84.0, 56.0, 52.0, 41.0, 32.0, 19.0, 21.0, 11.0, 11.0, 9.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.673828125, -0.653900146484375, -0.63397216796875, -0.614044189453125, -0.5941162109375, -0.574188232421875, -0.55426025390625, -0.534332275390625, -0.514404296875, -0.494476318359375, -0.47454833984375, -0.454620361328125, -0.4346923828125, -0.414764404296875, -0.39483642578125, -0.374908447265625, -0.35498046875, -0.335052490234375, -0.31512451171875, -0.295196533203125, -0.2752685546875, -0.255340576171875, -0.23541259765625, -0.215484619140625, -0.195556640625, -0.175628662109375, -0.15570068359375, -0.135772705078125, -0.1158447265625, -0.095916748046875, -0.07598876953125, -0.056060791015625, -0.0361328125, -0.016204833984375, 0.00372314453125, 0.023651123046875, 0.0435791015625, 0.063507080078125, 0.08343505859375, 0.103363037109375, 0.123291015625, 0.143218994140625, 0.16314697265625, 0.183074951171875, 0.2030029296875, 0.222930908203125, 0.24285888671875, 0.262786865234375, 0.28271484375, 0.302642822265625, 0.32257080078125, 0.342498779296875, 0.3624267578125, 0.382354736328125, 0.40228271484375, 0.422210693359375, 0.442138671875, 0.462066650390625, 0.48199462890625, 0.501922607421875, 0.5218505859375, 0.541778564453125, 0.56170654296875, 0.581634521484375, 0.6015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 7.0, 18.0, 39.0, 53.0, 70.0, 95.0, 121.0, 137.0, 128.0, 112.0, 100.0, 54.0, 33.0, 23.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6520538330078125, -7.473014831542969, -7.293975830078125, -7.114936828613281, -6.9358978271484375, -6.756858825683594, -6.57781982421875, -6.398780822753906, -6.2197418212890625, -6.040702819824219, -5.861663818359375, -5.682624816894531, -5.5035858154296875, -5.324546813964844, -5.1455078125, -4.966468811035156, -4.7874298095703125, -4.608390808105469, -4.429351806640625, -4.250312805175781, -4.0712738037109375, -3.8922348022460938, -3.71319580078125, -3.5341567993164062, -3.3551173210144043, -3.1760783195495605, -2.997039318084717, -2.818000316619873, -2.6389613151550293, -2.4599223136901855, -2.280883312225342, -2.101844310760498, -1.9228055477142334, -1.7437665462493896, -1.564727544784546, -1.3856885433197021, -1.2066495418548584, -1.0276105403900146, -0.8485714197158813, -0.6695324182510376, -0.49049341678619385, -0.3114544153213501, -0.13241538405418396, 0.04662364721298218, 0.22566264867782593, 0.4047016501426697, 0.5837407112121582, 0.762779712677002, 0.9418187141418457, 1.1208577156066895, 1.2998967170715332, 1.478935718536377, 1.6579747200012207, 1.8370137214660645, 2.016052722930908, 2.195091724395752, 2.3741307258605957, 2.5531697273254395, 2.732208728790283, 2.911247730255127, 3.0902867317199707, 3.2693257331848145, 3.448364734649658, 3.627403736114502, 3.806442975997925]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 6.0, 12.0, 16.0, 18.0, 23.0, 24.0, 25.0, 30.0, 27.0, 38.0, 36.0, 41.0, 28.0, 46.0, 39.0, 41.0, 40.0, 45.0, 34.0, 42.0, 31.0, 35.0, 32.0, 36.0, 36.0, 21.0, 26.0, 23.0, 18.0, 17.0, 19.0, 12.0, 6.0, 13.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.2632663249969482, -2.1969923973083496, -2.130718231201172, -2.0644443035125732, -1.9981701374053955, -1.9318960905075073, -1.8656220436096191, -1.7993481159210205, -1.7330739498138428, -1.6667999029159546, -1.6005258560180664, -1.5342518091201782, -1.46797776222229, -1.4017037153244019, -1.3354296684265137, -1.269155740737915, -1.2028816938400269, -1.1366076469421387, -1.0703336000442505, -1.0040595531463623, -0.9377855062484741, -0.8715114593505859, -0.8052374720573425, -0.7389634251594543, -0.6726893782615662, -0.606415331363678, -0.5401412844657898, -0.473867267370224, -0.4075932204723358, -0.34131917357444763, -0.27504515647888184, -0.20877110958099365, -0.14249706268310547, -0.07622302323579788, -0.009948983788490295, 0.056325048208236694, 0.12259909510612488, 0.18887314200401306, 0.25514715909957886, 0.32142120599746704, 0.3876952528953552, 0.4539692997932434, 0.5202433466911316, 0.586517333984375, 0.6527913808822632, 0.7190654277801514, 0.7853394746780396, 0.8516135215759277, 0.9178875684738159, 0.9841616153717041, 1.0504356622695923, 1.1167097091674805, 1.1829837560653687, 1.2492578029632568, 1.3155317306518555, 1.3818058967590332, 1.4480798244476318, 1.51435387134552, 1.5806279182434082, 1.6469019651412964, 1.7131760120391846, 1.7794500589370728, 1.845724105834961, 1.9119980335235596, 1.9782721996307373]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 14.0, 15.0, 19.0, 34.0, 52.0, 58.0, 101.0, 196.0, 339.0, 708.0, 1502.0, 3284.0, 7733.0, 18639.0, 45149.0, 109971.0, 241080.0, 306035.0, 181803.0, 77164.0, 31631.0, 13074.0, 5351.0, 2353.0, 1028.0, 513.0, 298.0, 146.0, 90.0, 51.0, 33.0, 24.0, 21.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.234375, -1.193634033203125, -1.15289306640625, -1.112152099609375, -1.0714111328125, -1.030670166015625, -0.98992919921875, -0.949188232421875, -0.908447265625, -0.867706298828125, -0.82696533203125, -0.786224365234375, -0.7454833984375, -0.704742431640625, -0.66400146484375, -0.623260498046875, -0.58251953125, -0.541778564453125, -0.50103759765625, -0.460296630859375, -0.4195556640625, -0.378814697265625, -0.33807373046875, -0.297332763671875, -0.256591796875, -0.215850830078125, -0.17510986328125, -0.134368896484375, -0.0936279296875, -0.052886962890625, -0.01214599609375, 0.028594970703125, 0.0693359375, 0.110076904296875, 0.15081787109375, 0.191558837890625, 0.2322998046875, 0.273040771484375, 0.31378173828125, 0.354522705078125, 0.395263671875, 0.436004638671875, 0.47674560546875, 0.517486572265625, 0.5582275390625, 0.598968505859375, 0.63970947265625, 0.680450439453125, 0.72119140625, 0.761932373046875, 0.80267333984375, 0.843414306640625, 0.8841552734375, 0.924896240234375, 0.96563720703125, 1.006378173828125, 1.047119140625, 1.087860107421875, 1.12860107421875, 1.169342041015625, 1.2100830078125, 1.250823974609375, 1.29156494140625, 1.332305908203125, 1.373046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 8.0, 5.0, 13.0, 12.0, 21.0, 21.0, 21.0, 31.0, 40.0, 34.0, 48.0, 47.0, 54.0, 59.0, 64.0, 61.0, 44.0, 62.0, 48.0, 61.0, 43.0, 27.0, 29.0, 30.0, 29.0, 28.0, 15.0, 4.0, 9.0, 8.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5252456665039062, -0.5099639892578125, -0.49468231201171875, -0.479400634765625, -0.46411895751953125, -0.4488372802734375, -0.43355560302734375, -0.41827392578125, -0.40299224853515625, -0.3877105712890625, -0.37242889404296875, -0.357147216796875, -0.34186553955078125, -0.3265838623046875, -0.31130218505859375, -0.2960205078125, -0.28073883056640625, -0.2654571533203125, -0.25017547607421875, -0.234893798828125, -0.21961212158203125, -0.2043304443359375, -0.18904876708984375, -0.17376708984375, -0.15848541259765625, -0.1432037353515625, -0.12792205810546875, -0.112640380859375, -0.09735870361328125, -0.0820770263671875, -0.06679534912109375, -0.051513671875, -0.03623199462890625, -0.0209503173828125, -0.00566864013671875, 0.009613037109375, 0.02489471435546875, 0.0401763916015625, 0.05545806884765625, 0.07073974609375, 0.08602142333984375, 0.1013031005859375, 0.11658477783203125, 0.131866455078125, 0.14714813232421875, 0.1624298095703125, 0.17771148681640625, 0.1929931640625, 0.20827484130859375, 0.2235565185546875, 0.23883819580078125, 0.254119873046875, 0.26940155029296875, 0.2846832275390625, 0.29996490478515625, 0.31524658203125, 0.33052825927734375, 0.3458099365234375, 0.36109161376953125, 0.376373291015625, 0.39165496826171875, 0.4069366455078125, 0.42221832275390625, 0.4375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 10.0, 6.0, 9.0, 7.0, 10.0, 17.0, 22.0, 36.0, 56.0, 112.0, 221.0, 449.0, 1174.0, 2768.0, 6599.0, 15448.0, 35676.0, 79341.0, 163264.0, 258986.0, 237325.0, 135000.0, 63086.0, 28110.0, 11878.0, 5102.0, 2109.0, 883.0, 370.0, 176.0, 95.0, 58.0, 31.0, 22.0, 14.0, 13.0, 13.0, 12.0, 6.0, 6.0, 6.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.162109375, -1.1256256103515625, -1.089141845703125, -1.0526580810546875, -1.01617431640625, -0.9796905517578125, -0.943206787109375, -0.9067230224609375, -0.8702392578125, -0.8337554931640625, -0.797271728515625, -0.7607879638671875, -0.72430419921875, -0.6878204345703125, -0.651336669921875, -0.6148529052734375, -0.578369140625, -0.5418853759765625, -0.505401611328125, -0.4689178466796875, -0.43243408203125, -0.3959503173828125, -0.359466552734375, -0.3229827880859375, -0.2864990234375, -0.2500152587890625, -0.213531494140625, -0.1770477294921875, -0.14056396484375, -0.1040802001953125, -0.067596435546875, -0.0311126708984375, 0.00537109375, 0.0418548583984375, 0.078338623046875, 0.1148223876953125, 0.15130615234375, 0.1877899169921875, 0.224273681640625, 0.2607574462890625, 0.2972412109375, 0.3337249755859375, 0.370208740234375, 0.4066925048828125, 0.44317626953125, 0.4796600341796875, 0.516143798828125, 0.5526275634765625, 0.589111328125, 0.6255950927734375, 0.662078857421875, 0.6985626220703125, 0.73504638671875, 0.7715301513671875, 0.808013916015625, 0.8444976806640625, 0.8809814453125, 0.9174652099609375, 0.953948974609375, 0.9904327392578125, 1.02691650390625, 1.0634002685546875, 1.099884033203125, 1.1363677978515625, 1.1728515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 6.0, 8.0, 10.0, 15.0, 8.0, 11.0, 10.0, 19.0, 21.0, 18.0, 26.0, 23.0, 34.0, 42.0, 33.0, 43.0, 50.0, 36.0, 59.0, 43.0, 43.0, 45.0, 41.0, 33.0, 47.0, 42.0, 34.0, 25.0, 34.0, 17.0, 10.0, 23.0, 16.0, 13.0, 9.0, 9.0, 11.0, 4.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0195770263671875, -0.986419677734375, -0.9532623291015625, -0.92010498046875, -0.8869476318359375, -0.853790283203125, -0.8206329345703125, -0.7874755859375, -0.7543182373046875, -0.721160888671875, -0.6880035400390625, -0.65484619140625, -0.6216888427734375, -0.588531494140625, -0.5553741455078125, -0.522216796875, -0.4890594482421875, -0.455902099609375, -0.4227447509765625, -0.38958740234375, -0.3564300537109375, -0.323272705078125, -0.2901153564453125, -0.2569580078125, -0.2238006591796875, -0.190643310546875, -0.1574859619140625, -0.12432861328125, -0.0911712646484375, -0.058013916015625, -0.0248565673828125, 0.00830078125, 0.0414581298828125, 0.074615478515625, 0.1077728271484375, 0.14093017578125, 0.1740875244140625, 0.207244873046875, 0.2404022216796875, 0.2735595703125, 0.3067169189453125, 0.339874267578125, 0.3730316162109375, 0.40618896484375, 0.4393463134765625, 0.472503662109375, 0.5056610107421875, 0.538818359375, 0.5719757080078125, 0.605133056640625, 0.6382904052734375, 0.67144775390625, 0.7046051025390625, 0.737762451171875, 0.7709197998046875, 0.8040771484375, 0.8372344970703125, 0.870391845703125, 0.9035491943359375, 0.93670654296875, 0.9698638916015625, 1.003021240234375, 1.0361785888671875, 1.0693359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 7.0, 22.0, 48.0, 43.0, 68.0, 109.0, 154.0, 244.0, 373.0, 584.0, 925.0, 1629.0, 2526.0, 4401.0, 7889.0, 14806.0, 27719.0, 50989.0, 88406.0, 136266.0, 174265.0, 177530.0, 142663.0, 94670.0, 55361.0, 30290.0, 15979.0, 8620.0, 4753.0, 2795.0, 1566.0, 999.0, 610.0, 439.0, 285.0, 179.0, 102.0, 77.0, 42.0, 31.0, 16.0, 20.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.309814453125, -0.30072021484375, -0.2916259765625, -0.28253173828125, -0.2734375, -0.26434326171875, -0.2552490234375, -0.24615478515625, -0.237060546875, -0.22796630859375, -0.2188720703125, -0.20977783203125, -0.20068359375, -0.19158935546875, -0.1824951171875, -0.17340087890625, -0.164306640625, -0.15521240234375, -0.1461181640625, -0.13702392578125, -0.1279296875, -0.11883544921875, -0.1097412109375, -0.10064697265625, -0.091552734375, -0.08245849609375, -0.0733642578125, -0.06427001953125, -0.05517578125, -0.04608154296875, -0.0369873046875, -0.02789306640625, -0.018798828125, -0.00970458984375, -0.0006103515625, 0.00848388671875, 0.017578125, 0.02667236328125, 0.0357666015625, 0.04486083984375, 0.053955078125, 0.06304931640625, 0.0721435546875, 0.08123779296875, 0.09033203125, 0.09942626953125, 0.1085205078125, 0.11761474609375, 0.126708984375, 0.13580322265625, 0.1448974609375, 0.15399169921875, 0.1630859375, 0.17218017578125, 0.1812744140625, 0.19036865234375, 0.199462890625, 0.20855712890625, 0.2176513671875, 0.22674560546875, 0.23583984375, 0.24493408203125, 0.2540283203125, 0.26312255859375, 0.272216796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 4.0, 4.0, 9.0, 9.0, 13.0, 18.0, 32.0, 35.0, 43.0, 71.0, 86.0, 101.0, 111.0, 102.0, 94.0, 80.0, 56.0, 48.0, 28.0, 19.0, 9.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012230873107910156, -0.00011885538697242737, -0.00011540204286575317, -0.00011194869875907898, -0.00010849535465240479, -0.00010504201054573059, -0.0001015886664390564, -9.81353223323822e-05, -9.468197822570801e-05, -9.122863411903381e-05, -8.777529001235962e-05, -8.432194590568542e-05, -8.086860179901123e-05, -7.741525769233704e-05, -7.396191358566284e-05, -7.050856947898865e-05, -6.705522537231445e-05, -6.360188126564026e-05, -6.0148537158966064e-05, -5.669519305229187e-05, -5.3241848945617676e-05, -4.978850483894348e-05, -4.633516073226929e-05, -4.288181662559509e-05, -3.94284725189209e-05, -3.5975128412246704e-05, -3.252178430557251e-05, -2.9068440198898315e-05, -2.561509609222412e-05, -2.2161751985549927e-05, -1.8708407878875732e-05, -1.5255063772201538e-05, -1.1801719665527344e-05, -8.34837555885315e-06, -4.895031452178955e-06, -1.4416873455047607e-06, 2.0116567611694336e-06, 5.465000867843628e-06, 8.918344974517822e-06, 1.2371689081192017e-05, 1.582503318786621e-05, 1.9278377294540405e-05, 2.27317214012146e-05, 2.6185065507888794e-05, 2.9638409614562988e-05, 3.309175372123718e-05, 3.654509782791138e-05, 3.999844193458557e-05, 4.3451786041259766e-05, 4.690513014793396e-05, 5.0358474254608154e-05, 5.381181836128235e-05, 5.726516246795654e-05, 6.071850657463074e-05, 6.417185068130493e-05, 6.762519478797913e-05, 7.107853889465332e-05, 7.453188300132751e-05, 7.798522710800171e-05, 8.14385712146759e-05, 8.48919153213501e-05, 8.834525942802429e-05, 9.179860353469849e-05, 9.525194764137268e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 13.0, 30.0, 42.0, 61.0, 113.0, 190.0, 319.0, 559.0, 1112.0, 2150.0, 4234.0, 9079.0, 20924.0, 48609.0, 104120.0, 184211.0, 237816.0, 203582.0, 123799.0, 59578.0, 26027.0, 11378.0, 5060.0, 2563.0, 1329.0, 717.0, 408.0, 207.0, 133.0, 72.0, 35.0, 27.0, 14.0, 10.0, 10.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36669921875, -0.356109619140625, -0.34552001953125, -0.334930419921875, -0.3243408203125, -0.313751220703125, -0.30316162109375, -0.292572021484375, -0.281982421875, -0.271392822265625, -0.26080322265625, -0.250213623046875, -0.2396240234375, -0.229034423828125, -0.21844482421875, -0.207855224609375, -0.197265625, -0.186676025390625, -0.17608642578125, -0.165496826171875, -0.1549072265625, -0.144317626953125, -0.13372802734375, -0.123138427734375, -0.112548828125, -0.101959228515625, -0.09136962890625, -0.080780029296875, -0.0701904296875, -0.059600830078125, -0.04901123046875, -0.038421630859375, -0.02783203125, -0.017242431640625, -0.00665283203125, 0.003936767578125, 0.0145263671875, 0.025115966796875, 0.03570556640625, 0.046295166015625, 0.056884765625, 0.067474365234375, 0.07806396484375, 0.088653564453125, 0.0992431640625, 0.109832763671875, 0.12042236328125, 0.131011962890625, 0.1416015625, 0.152191162109375, 0.16278076171875, 0.173370361328125, 0.1839599609375, 0.194549560546875, 0.20513916015625, 0.215728759765625, 0.226318359375, 0.236907958984375, 0.24749755859375, 0.258087158203125, 0.2686767578125, 0.279266357421875, 0.28985595703125, 0.300445556640625, 0.31103515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 2.0, 5.0, 12.0, 7.0, 16.0, 17.0, 15.0, 26.0, 30.0, 28.0, 39.0, 39.0, 48.0, 45.0, 48.0, 46.0, 63.0, 55.0, 48.0, 65.0, 46.0, 41.0, 35.0, 21.0, 42.0, 29.0, 21.0, 19.0, 28.0, 12.0, 11.0, 11.0, 10.0, 2.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.283935546875, -0.2748870849609375, -0.265838623046875, -0.2567901611328125, -0.24774169921875, -0.2386932373046875, -0.229644775390625, -0.2205963134765625, -0.2115478515625, -0.2024993896484375, -0.193450927734375, -0.1844024658203125, -0.17535400390625, -0.1663055419921875, -0.157257080078125, -0.1482086181640625, -0.13916015625, -0.1301116943359375, -0.121063232421875, -0.1120147705078125, -0.10296630859375, -0.0939178466796875, -0.084869384765625, -0.0758209228515625, -0.0667724609375, -0.0577239990234375, -0.048675537109375, -0.0396270751953125, -0.03057861328125, -0.0215301513671875, -0.012481689453125, -0.0034332275390625, 0.005615234375, 0.0146636962890625, 0.023712158203125, 0.0327606201171875, 0.04180908203125, 0.0508575439453125, 0.059906005859375, 0.0689544677734375, 0.0780029296875, 0.0870513916015625, 0.096099853515625, 0.1051483154296875, 0.11419677734375, 0.1232452392578125, 0.132293701171875, 0.1413421630859375, 0.150390625, 0.1594390869140625, 0.168487548828125, 0.1775360107421875, 0.18658447265625, 0.1956329345703125, 0.204681396484375, 0.2137298583984375, 0.2227783203125, 0.2318267822265625, 0.240875244140625, 0.2499237060546875, 0.25897216796875, 0.2680206298828125, 0.277069091796875, 0.2861175537109375, 0.295166015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 15.0, 16.0, 34.0, 43.0, 63.0, 77.0, 90.0, 89.0, 112.0, 102.0, 100.0, 75.0, 61.0, 44.0, 37.0, 14.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.326821804046631, -7.169806957244873, -7.012792587280273, -6.855777740478516, -6.698762893676758, -6.541748046875, -6.384733200073242, -6.227718830108643, -6.070703983306885, -5.913689136505127, -5.756674766540527, -5.5996599197387695, -5.442645072937012, -5.285630226135254, -5.128615379333496, -4.9716010093688965, -4.814586162567139, -4.657571315765381, -4.500556945800781, -4.343542098999023, -4.186527252197266, -4.029512405395508, -3.872497797012329, -3.7154831886291504, -3.5584683418273926, -3.4014534950256348, -3.244438886642456, -3.0874242782592773, -2.9304094314575195, -2.7733945846557617, -2.616379976272583, -2.4593653678894043, -2.3023500442504883, -2.1453351974487305, -1.9883205890655518, -1.8313058614730835, -1.6742911338806152, -1.517276406288147, -1.3602616786956787, -1.2032469511032104, -1.0462322235107422, -0.8892174959182739, -0.7322027683258057, -0.5751880407333374, -0.41817331314086914, -0.2611585855484009, -0.10414385795593262, 0.052870869636535645, 0.2098855972290039, 0.36690032482147217, 0.5239150524139404, 0.6809297800064087, 0.837944507598877, 0.9949592351913452, 1.1519739627838135, 1.3089886903762817, 1.46600341796875, 1.6230181455612183, 1.7800328731536865, 1.9370476007461548, 2.094062328338623, 2.251077175140381, 2.4080917835235596, 2.5651063919067383, 2.722121238708496]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 5.0, 7.0, 6.0, 9.0, 6.0, 9.0, 12.0, 12.0, 18.0, 23.0, 28.0, 23.0, 27.0, 30.0, 37.0, 38.0, 43.0, 43.0, 34.0, 55.0, 36.0, 36.0, 36.0, 51.0, 36.0, 30.0, 33.0, 35.0, 23.0, 35.0, 29.0, 20.0, 22.0, 33.0, 18.0, 15.0, 10.0, 11.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1466610431671143, -3.0448029041290283, -2.9429447650909424, -2.8410866260528564, -2.7392284870147705, -2.6373703479766846, -2.5355124473571777, -2.433654308319092, -2.331796169281006, -2.22993803024292, -2.128079891204834, -2.026221752166748, -1.924363613128662, -1.8225054740905762, -1.7206474542617798, -1.6187893152236938, -1.5169310569763184, -1.4150729179382324, -1.3132147789001465, -1.2113566398620605, -1.1094985008239746, -1.0076403617858887, -0.9057823419570923, -0.8039242029190063, -0.7020660638809204, -0.6002079248428345, -0.4983498156070709, -0.3964917063713074, -0.29463356733322144, -0.1927754282951355, -0.09091734886169434, 0.010940790176391602, 0.11279916763305664, 0.21465729176998138, 0.31651541590690613, 0.4183735251426697, 0.5202316641807556, 0.6220898032188416, 0.7239478826522827, 0.8258060216903687, 0.9276641607284546, 1.0295222997665405, 1.1313804388046265, 1.2332384586334229, 1.3350965976715088, 1.4369547367095947, 1.5388128757476807, 1.6406710147857666, 1.7425291538238525, 1.8443872928619385, 1.9462454319000244, 2.0481035709381104, 2.1499617099761963, 2.2518198490142822, 2.353677749633789, 2.455535888671875, 2.557394027709961, 2.659252166748047, 2.761110305786133, 2.8629684448242188, 2.9648265838623047, 3.0666847229003906, 3.1685428619384766, 3.2704010009765625, 3.3722591400146484]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 5.0, 9.0, 11.0, 8.0, 24.0, 33.0, 44.0, 69.0, 101.0, 143.0, 217.0, 359.0, 651.0, 1276.0, 2731.0, 5906.0, 14426.0, 39253.0, 128096.0, 534715.0, 1802942.0, 1248449.0, 291359.0, 78021.0, 26456.0, 10344.0, 4314.0, 2084.0, 971.0, 568.0, 272.0, 154.0, 99.0, 53.0, 40.0, 21.0, 14.0, 7.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80078125, -0.7763671875, -0.751953125, -0.7275390625, -0.703125, -0.6787109375, -0.654296875, -0.6298828125, -0.60546875, -0.5810546875, -0.556640625, -0.5322265625, -0.5078125, -0.4833984375, -0.458984375, -0.4345703125, -0.41015625, -0.3857421875, -0.361328125, -0.3369140625, -0.3125, -0.2880859375, -0.263671875, -0.2392578125, -0.21484375, -0.1904296875, -0.166015625, -0.1416015625, -0.1171875, -0.0927734375, -0.068359375, -0.0439453125, -0.01953125, 0.0048828125, 0.029296875, 0.0537109375, 0.078125, 0.1025390625, 0.126953125, 0.1513671875, 0.17578125, 0.2001953125, 0.224609375, 0.2490234375, 0.2734375, 0.2978515625, 0.322265625, 0.3466796875, 0.37109375, 0.3955078125, 0.419921875, 0.4443359375, 0.46875, 0.4931640625, 0.517578125, 0.5419921875, 0.56640625, 0.5908203125, 0.615234375, 0.6396484375, 0.6640625, 0.6884765625, 0.712890625, 0.7373046875, 0.76171875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 11.0, 10.0, 21.0, 19.0, 21.0, 21.0, 40.0, 28.0, 41.0, 36.0, 53.0, 63.0, 72.0, 63.0, 57.0, 54.0, 50.0, 54.0, 47.0, 59.0, 40.0, 25.0, 28.0, 13.0, 11.0, 16.0, 13.0, 8.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5994873046875, -0.582275390625, -0.5650634765625, -0.5478515625, -0.5306396484375, -0.513427734375, -0.4962158203125, -0.47900390625, -0.4617919921875, -0.444580078125, -0.4273681640625, -0.41015625, -0.3929443359375, -0.375732421875, -0.3585205078125, -0.34130859375, -0.3240966796875, -0.306884765625, -0.2896728515625, -0.2724609375, -0.2552490234375, -0.238037109375, -0.2208251953125, -0.20361328125, -0.1864013671875, -0.169189453125, -0.1519775390625, -0.134765625, -0.1175537109375, -0.100341796875, -0.0831298828125, -0.06591796875, -0.0487060546875, -0.031494140625, -0.0142822265625, 0.0029296875, 0.0201416015625, 0.037353515625, 0.0545654296875, 0.07177734375, 0.0889892578125, 0.106201171875, 0.1234130859375, 0.140625, 0.1578369140625, 0.175048828125, 0.1922607421875, 0.20947265625, 0.2266845703125, 0.243896484375, 0.2611083984375, 0.2783203125, 0.2955322265625, 0.312744140625, 0.3299560546875, 0.34716796875, 0.3643798828125, 0.381591796875, 0.3988037109375, 0.416015625, 0.4332275390625, 0.450439453125, 0.4676513671875, 0.48486328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 9.0, 8.0, 13.0, 23.0, 33.0, 48.0, 63.0, 155.0, 263.0, 554.0, 1560.0, 6115.0, 31325.0, 212412.0, 1605767.0, 1994807.0, 289612.0, 40599.0, 7565.0, 1996.0, 666.0, 310.0, 128.0, 92.0, 56.0, 39.0, 15.0, 14.0, 9.0, 11.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3115234375, -1.269317626953125, -1.22711181640625, -1.184906005859375, -1.1427001953125, -1.100494384765625, -1.05828857421875, -1.016082763671875, -0.973876953125, -0.931671142578125, -0.88946533203125, -0.847259521484375, -0.8050537109375, -0.762847900390625, -0.72064208984375, -0.678436279296875, -0.63623046875, -0.594024658203125, -0.55181884765625, -0.509613037109375, -0.4674072265625, -0.425201416015625, -0.38299560546875, -0.340789794921875, -0.298583984375, -0.256378173828125, -0.21417236328125, -0.171966552734375, -0.1297607421875, -0.087554931640625, -0.04534912109375, -0.003143310546875, 0.0390625, 0.081268310546875, 0.12347412109375, 0.165679931640625, 0.2078857421875, 0.250091552734375, 0.29229736328125, 0.334503173828125, 0.376708984375, 0.418914794921875, 0.46112060546875, 0.503326416015625, 0.5455322265625, 0.587738037109375, 0.62994384765625, 0.672149658203125, 0.71435546875, 0.756561279296875, 0.79876708984375, 0.840972900390625, 0.8831787109375, 0.925384521484375, 0.96759033203125, 1.009796142578125, 1.052001953125, 1.094207763671875, 1.13641357421875, 1.178619384765625, 1.2208251953125, 1.263031005859375, 1.30523681640625, 1.347442626953125, 1.3896484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 10.0, 4.0, 12.0, 14.0, 20.0, 30.0, 37.0, 51.0, 62.0, 95.0, 110.0, 153.0, 212.0, 272.0, 310.0, 328.0, 397.0, 372.0, 299.0, 270.0, 239.0, 188.0, 147.0, 118.0, 92.0, 50.0, 51.0, 41.0, 25.0, 19.0, 12.0, 8.0, 5.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7353515625, -0.7135467529296875, -0.691741943359375, -0.6699371337890625, -0.64813232421875, -0.6263275146484375, -0.604522705078125, -0.5827178955078125, -0.5609130859375, -0.5391082763671875, -0.517303466796875, -0.4954986572265625, -0.47369384765625, -0.4518890380859375, -0.430084228515625, -0.4082794189453125, -0.386474609375, -0.3646697998046875, -0.342864990234375, -0.3210601806640625, -0.29925537109375, -0.2774505615234375, -0.255645751953125, -0.2338409423828125, -0.2120361328125, -0.1902313232421875, -0.168426513671875, -0.1466217041015625, -0.12481689453125, -0.1030120849609375, -0.081207275390625, -0.0594024658203125, -0.03759765625, -0.0157928466796875, 0.006011962890625, 0.0278167724609375, 0.04962158203125, 0.0714263916015625, 0.093231201171875, 0.1150360107421875, 0.1368408203125, 0.1586456298828125, 0.180450439453125, 0.2022552490234375, 0.22406005859375, 0.2458648681640625, 0.267669677734375, 0.2894744873046875, 0.311279296875, 0.3330841064453125, 0.354888916015625, 0.3766937255859375, 0.39849853515625, 0.4203033447265625, 0.442108154296875, 0.4639129638671875, 0.4857177734375, 0.5075225830078125, 0.529327392578125, 0.5511322021484375, 0.57293701171875, 0.5947418212890625, 0.616546630859375, 0.6383514404296875, 0.66015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 20.0, 36.0, 68.0, 93.0, 128.0, 129.0, 126.0, 133.0, 88.0, 54.0, 55.0, 22.0, 22.0, 11.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.044299125671387, -8.860620498657227, -8.676941871643066, -8.493263244628906, -8.309584617614746, -8.125905990600586, -7.942227363586426, -7.758548736572266, -7.5748701095581055, -7.391191482543945, -7.207512855529785, -7.023834228515625, -6.840155601501465, -6.656476974487305, -6.4727983474731445, -6.289119720458984, -6.105441093444824, -5.921762466430664, -5.738083839416504, -5.554405212402344, -5.370726585388184, -5.187047958374023, -5.003369331359863, -4.819690704345703, -4.636012554168701, -4.452333927154541, -4.268655300140381, -4.084976673126221, -3.9012980461120605, -3.7176194190979004, -3.5339407920837402, -3.35026216506958, -3.16658353805542, -2.9829049110412598, -2.7992262840270996, -2.6155476570129395, -2.4318690299987793, -2.248190402984619, -2.064511775970459, -1.8808332681655884, -1.6971546411514282, -1.513476014137268, -1.329797387123108, -1.1461188793182373, -0.9624401926994324, -0.7787615656852722, -0.5950829982757568, -0.4114043712615967, -0.22772574424743652, -0.04404713213443756, 0.1396314799785614, 0.32331007719039917, 0.5069887042045593, 0.6906673312187195, 0.8743458986282349, 1.058024525642395, 1.2417031526565552, 1.4253817796707153, 1.6090604066848755, 1.792738914489746, 1.9764175415039062, 2.1600961685180664, 2.3437747955322266, 2.5274534225463867, 2.711132049560547]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 5.0, 5.0, 11.0, 10.0, 16.0, 22.0, 17.0, 20.0, 14.0, 15.0, 18.0, 35.0, 27.0, 20.0, 26.0, 37.0, 43.0, 31.0, 43.0, 40.0, 39.0, 44.0, 32.0, 45.0, 37.0, 31.0, 42.0, 35.0, 24.0, 35.0, 20.0, 24.0, 16.0, 18.0, 14.0, 11.0, 19.0, 12.0, 11.0, 5.0, 8.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.0095295906066895, -1.940954327583313, -1.8723790645599365, -1.8038036823272705, -1.735228419303894, -1.6666531562805176, -1.5980777740478516, -1.529502511024475, -1.4609272480010986, -1.3923519849777222, -1.3237767219543457, -1.2552013397216797, -1.1866260766983032, -1.1180508136749268, -1.0494754314422607, -0.9809001684188843, -0.9123249053955078, -0.8437496423721313, -0.7751743197441101, -0.7065989971160889, -0.6380237340927124, -0.5694484710693359, -0.5008731484413147, -0.43229785561561584, -0.363722562789917, -0.29514726996421814, -0.2265719771385193, -0.15799668431282043, -0.08942139148712158, -0.02084609866142273, 0.04772919416427612, 0.11630448698997498, 0.18487954139709473, 0.2534548342227936, 0.32203012704849243, 0.3906054198741913, 0.45918071269989014, 0.5277559757232666, 0.5963312983512878, 0.6649066209793091, 0.7334818840026855, 0.802057147026062, 0.8706324696540833, 0.9392077922821045, 1.007783055305481, 1.0763583183288574, 1.1449337005615234, 1.2135089635849, 1.2820842266082764, 1.3506594896316528, 1.4192347526550293, 1.4878101348876953, 1.5563853979110718, 1.6249606609344482, 1.6935360431671143, 1.7621113061904907, 1.8306865692138672, 1.8992618322372437, 1.9678370952606201, 2.036412477493286, 2.104987621307373, 2.173563003540039, 2.242138385772705, 2.310713529586792, 2.379288911819458]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 13.0, 15.0, 14.0, 22.0, 31.0, 24.0, 41.0, 77.0, 123.0, 244.0, 471.0, 927.0, 1888.0, 4133.0, 9506.0, 22495.0, 54832.0, 134378.0, 275672.0, 288912.0, 148715.0, 61760.0, 24819.0, 10547.0, 4616.0, 2075.0, 991.0, 513.0, 268.0, 149.0, 87.0, 49.0, 33.0, 24.0, 23.0, 15.0, 14.0, 5.0, 5.0, 5.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0703125, -2.0076904296875, -1.945068359375, -1.8824462890625, -1.81982421875, -1.7572021484375, -1.694580078125, -1.6319580078125, -1.5693359375, -1.5067138671875, -1.444091796875, -1.3814697265625, -1.31884765625, -1.2562255859375, -1.193603515625, -1.1309814453125, -1.068359375, -1.0057373046875, -0.943115234375, -0.8804931640625, -0.81787109375, -0.7552490234375, -0.692626953125, -0.6300048828125, -0.5673828125, -0.5047607421875, -0.442138671875, -0.3795166015625, -0.31689453125, -0.2542724609375, -0.191650390625, -0.1290283203125, -0.06640625, -0.0037841796875, 0.058837890625, 0.1214599609375, 0.18408203125, 0.2467041015625, 0.309326171875, 0.3719482421875, 0.4345703125, 0.4971923828125, 0.559814453125, 0.6224365234375, 0.68505859375, 0.7476806640625, 0.810302734375, 0.8729248046875, 0.935546875, 0.9981689453125, 1.060791015625, 1.1234130859375, 1.18603515625, 1.2486572265625, 1.311279296875, 1.3739013671875, 1.4365234375, 1.4991455078125, 1.561767578125, 1.6243896484375, 1.68701171875, 1.7496337890625, 1.812255859375, 1.8748779296875, 1.9375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 9.0, 12.0, 24.0, 24.0, 36.0, 25.0, 33.0, 32.0, 53.0, 58.0, 66.0, 65.0, 70.0, 63.0, 60.0, 56.0, 57.0, 47.0, 42.0, 42.0, 25.0, 26.0, 16.0, 13.0, 11.0, 7.0, 10.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6220703125, -0.6041183471679688, -0.5861663818359375, -0.5682144165039062, -0.550262451171875, -0.5323104858398438, -0.5143585205078125, -0.49640655517578125, -0.47845458984375, -0.46050262451171875, -0.4425506591796875, -0.42459869384765625, -0.406646728515625, -0.38869476318359375, -0.3707427978515625, -0.35279083251953125, -0.3348388671875, -0.31688690185546875, -0.2989349365234375, -0.28098297119140625, -0.263031005859375, -0.24507904052734375, -0.2271270751953125, -0.20917510986328125, -0.19122314453125, -0.17327117919921875, -0.1553192138671875, -0.13736724853515625, -0.119415283203125, -0.10146331787109375, -0.0835113525390625, -0.06555938720703125, -0.047607421875, -0.02965545654296875, -0.0117034912109375, 0.00624847412109375, 0.024200439453125, 0.04215240478515625, 0.0601043701171875, 0.07805633544921875, 0.09600830078125, 0.11396026611328125, 0.1319122314453125, 0.14986419677734375, 0.167816162109375, 0.18576812744140625, 0.2037200927734375, 0.22167205810546875, 0.2396240234375, 0.25757598876953125, 0.2755279541015625, 0.29347991943359375, 0.311431884765625, 0.32938385009765625, 0.3473358154296875, 0.36528778076171875, 0.38323974609375, 0.40119171142578125, 0.4191436767578125, 0.43709564208984375, 0.455047607421875, 0.47299957275390625, 0.4909515380859375, 0.5089035034179688, 0.52685546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 1.0, 13.0, 11.0, 18.0, 22.0, 34.0, 36.0, 38.0, 86.0, 101.0, 162.0, 240.0, 446.0, 671.0, 1198.0, 2149.0, 4088.0, 7706.0, 14700.0, 28591.0, 54606.0, 96781.0, 153603.0, 197925.0, 185874.0, 131288.0, 78126.0, 42709.0, 22395.0, 11543.0, 6021.0, 3132.0, 1747.0, 936.0, 602.0, 323.0, 215.0, 133.0, 81.0, 56.0, 37.0, 27.0, 24.0, 18.0, 12.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0986328125, -1.0629730224609375, -1.027313232421875, -0.9916534423828125, -0.95599365234375, -0.9203338623046875, -0.884674072265625, -0.8490142822265625, -0.8133544921875, -0.7776947021484375, -0.742034912109375, -0.7063751220703125, -0.67071533203125, -0.6350555419921875, -0.599395751953125, -0.5637359619140625, -0.528076171875, -0.4924163818359375, -0.456756591796875, -0.4210968017578125, -0.38543701171875, -0.3497772216796875, -0.314117431640625, -0.2784576416015625, -0.2427978515625, -0.2071380615234375, -0.171478271484375, -0.1358184814453125, -0.10015869140625, -0.0644989013671875, -0.028839111328125, 0.0068206787109375, 0.04248046875, 0.0781402587890625, 0.113800048828125, 0.1494598388671875, 0.18511962890625, 0.2207794189453125, 0.256439208984375, 0.2920989990234375, 0.3277587890625, 0.3634185791015625, 0.399078369140625, 0.4347381591796875, 0.47039794921875, 0.5060577392578125, 0.541717529296875, 0.5773773193359375, 0.613037109375, 0.6486968994140625, 0.684356689453125, 0.7200164794921875, 0.75567626953125, 0.7913360595703125, 0.826995849609375, 0.8626556396484375, 0.8983154296875, 0.9339752197265625, 0.969635009765625, 1.0052947998046875, 1.04095458984375, 1.0766143798828125, 1.112274169921875, 1.1479339599609375, 1.18359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 9.0, 5.0, 7.0, 4.0, 7.0, 8.0, 14.0, 21.0, 31.0, 26.0, 22.0, 33.0, 30.0, 39.0, 28.0, 35.0, 43.0, 39.0, 49.0, 54.0, 49.0, 39.0, 45.0, 38.0, 35.0, 60.0, 30.0, 30.0, 27.0, 15.0, 30.0, 19.0, 20.0, 11.0, 23.0, 10.0, 4.0, 4.0, 5.0, 2.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3857421875, -1.3457794189453125, -1.305816650390625, -1.2658538818359375, -1.22589111328125, -1.1859283447265625, -1.145965576171875, -1.1060028076171875, -1.0660400390625, -1.0260772705078125, -0.986114501953125, -0.9461517333984375, -0.90618896484375, -0.8662261962890625, -0.826263427734375, -0.7863006591796875, -0.746337890625, -0.7063751220703125, -0.666412353515625, -0.6264495849609375, -0.58648681640625, -0.5465240478515625, -0.506561279296875, -0.4665985107421875, -0.4266357421875, -0.3866729736328125, -0.346710205078125, -0.3067474365234375, -0.26678466796875, -0.2268218994140625, -0.186859130859375, -0.1468963623046875, -0.10693359375, -0.0669708251953125, -0.027008056640625, 0.0129547119140625, 0.05291748046875, 0.0928802490234375, 0.132843017578125, 0.1728057861328125, 0.2127685546875, 0.2527313232421875, 0.292694091796875, 0.3326568603515625, 0.37261962890625, 0.4125823974609375, 0.452545166015625, 0.4925079345703125, 0.532470703125, 0.5724334716796875, 0.612396240234375, 0.6523590087890625, 0.69232177734375, 0.7322845458984375, 0.772247314453125, 0.8122100830078125, 0.8521728515625, 0.8921356201171875, 0.932098388671875, 0.9720611572265625, 1.01202392578125, 1.0519866943359375, 1.091949462890625, 1.1319122314453125, 1.171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 11.0, 19.0, 20.0, 32.0, 49.0, 74.0, 113.0, 187.0, 289.0, 457.0, 687.0, 1121.0, 1729.0, 2955.0, 4815.0, 8327.0, 14426.0, 27075.0, 51342.0, 94790.0, 161400.0, 215671.0, 191871.0, 122276.0, 67950.0, 35514.0, 19009.0, 10479.0, 6101.0, 3709.0, 2220.0, 1385.0, 867.0, 542.0, 388.0, 224.0, 159.0, 82.0, 62.0, 42.0, 30.0, 18.0, 12.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.50390625, -0.4885063171386719, -0.47310638427734375, -0.4577064514160156, -0.4423065185546875, -0.4269065856933594, -0.41150665283203125, -0.3961067199707031, -0.380706787109375, -0.3653068542480469, -0.34990692138671875, -0.3345069885253906, -0.3191070556640625, -0.3037071228027344, -0.28830718994140625, -0.2729072570800781, -0.25750732421875, -0.24210739135742188, -0.22670745849609375, -0.21130752563476562, -0.1959075927734375, -0.18050765991210938, -0.16510772705078125, -0.14970779418945312, -0.134307861328125, -0.11890792846679688, -0.10350799560546875, -0.08810806274414062, -0.0727081298828125, -0.057308197021484375, -0.04190826416015625, -0.026508331298828125, -0.0111083984375, 0.004291534423828125, 0.01969146728515625, 0.035091400146484375, 0.0504913330078125, 0.06589126586914062, 0.08129119873046875, 0.09669113159179688, 0.112091064453125, 0.12749099731445312, 0.14289093017578125, 0.15829086303710938, 0.1736907958984375, 0.18909072875976562, 0.20449066162109375, 0.21989059448242188, 0.23529052734375, 0.2506904602050781, 0.26609039306640625, 0.2814903259277344, 0.2968902587890625, 0.3122901916503906, 0.32769012451171875, 0.3430900573730469, 0.358489990234375, 0.3738899230957031, 0.38928985595703125, 0.4046897888183594, 0.4200897216796875, 0.4354896545410156, 0.45088958740234375, 0.4662895202636719, 0.481689453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 16.0, 15.0, 18.0, 30.0, 49.0, 67.0, 90.0, 149.0, 171.0, 138.0, 101.0, 50.0, 35.0, 23.0, 13.0, 11.0, 7.0, 5.0, 9.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022411346435546875, -0.00021554529666900635, -0.00020697712898254395, -0.00019840896129608154, -0.00018984079360961914, -0.00018127262592315674, -0.00017270445823669434, -0.00016413629055023193, -0.00015556812286376953, -0.00014699995517730713, -0.00013843178749084473, -0.00012986361980438232, -0.00012129545211791992, -0.00011272728443145752, -0.00010415911674499512, -9.559094905853271e-05, -8.702278137207031e-05, -7.845461368560791e-05, -6.988644599914551e-05, -6.13182783126831e-05, -5.27501106262207e-05, -4.41819429397583e-05, -3.56137752532959e-05, -2.7045607566833496e-05, -1.8477439880371094e-05, -9.909272193908691e-06, -1.341104507446289e-06, 7.227063179016113e-06, 1.5795230865478516e-05, 2.4363398551940918e-05, 3.293156623840332e-05, 4.149973392486572e-05, 5.0067901611328125e-05, 5.863606929779053e-05, 6.720423698425293e-05, 7.577240467071533e-05, 8.434057235717773e-05, 9.290874004364014e-05, 0.00010147690773010254, 0.00011004507541656494, 0.00011861324310302734, 0.00012718141078948975, 0.00013574957847595215, 0.00014431774616241455, 0.00015288591384887695, 0.00016145408153533936, 0.00017002224922180176, 0.00017859041690826416, 0.00018715858459472656, 0.00019572675228118896, 0.00020429491996765137, 0.00021286308765411377, 0.00022143125534057617, 0.00022999942302703857, 0.00023856759071350098, 0.0002471357583999634, 0.0002557039260864258, 0.0002642720937728882, 0.0002728402614593506, 0.000281408429145813, 0.0002899765968322754, 0.0002985447645187378, 0.0003071129322052002, 0.0003156810998916626, 0.000324249267578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 12.0, 27.0, 37.0, 55.0, 70.0, 151.0, 249.0, 429.0, 814.0, 1276.0, 2360.0, 4484.0, 8927.0, 18729.0, 43721.0, 107511.0, 238961.0, 304476.0, 180875.0, 75499.0, 31195.0, 13969.0, 6849.0, 3458.0, 1860.0, 1095.0, 623.0, 352.0, 202.0, 113.0, 59.0, 35.0, 31.0, 10.0, 10.0, 9.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6847076416015625, -0.665313720703125, -0.6459197998046875, -0.62652587890625, -0.6071319580078125, -0.587738037109375, -0.5683441162109375, -0.5489501953125, -0.5295562744140625, -0.510162353515625, -0.4907684326171875, -0.47137451171875, -0.4519805908203125, -0.432586669921875, -0.4131927490234375, -0.393798828125, -0.3744049072265625, -0.355010986328125, -0.3356170654296875, -0.31622314453125, -0.2968292236328125, -0.277435302734375, -0.2580413818359375, -0.2386474609375, -0.2192535400390625, -0.199859619140625, -0.1804656982421875, -0.16107177734375, -0.1416778564453125, -0.122283935546875, -0.1028900146484375, -0.08349609375, -0.0641021728515625, -0.044708251953125, -0.0253143310546875, -0.00592041015625, 0.0134735107421875, 0.032867431640625, 0.0522613525390625, 0.0716552734375, 0.0910491943359375, 0.110443115234375, 0.1298370361328125, 0.14923095703125, 0.1686248779296875, 0.188018798828125, 0.2074127197265625, 0.226806640625, 0.2462005615234375, 0.265594482421875, 0.2849884033203125, 0.30438232421875, 0.3237762451171875, 0.343170166015625, 0.3625640869140625, 0.3819580078125, 0.4013519287109375, 0.420745849609375, 0.4401397705078125, 0.45953369140625, 0.4789276123046875, 0.498321533203125, 0.5177154541015625, 0.537109375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 10.0, 12.0, 18.0, 18.0, 31.0, 33.0, 47.0, 53.0, 72.0, 65.0, 72.0, 82.0, 71.0, 68.0, 63.0, 51.0, 39.0, 34.0, 30.0, 22.0, 18.0, 14.0, 15.0, 11.0, 9.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4208183288574219, -0.40438079833984375, -0.3879432678222656, -0.3715057373046875, -0.3550682067871094, -0.33863067626953125, -0.3221931457519531, -0.305755615234375, -0.2893180847167969, -0.27288055419921875, -0.2564430236816406, -0.2400054931640625, -0.22356796264648438, -0.20713043212890625, -0.19069290161132812, -0.17425537109375, -0.15781784057617188, -0.14138031005859375, -0.12494277954101562, -0.1085052490234375, -0.09206771850585938, -0.07563018798828125, -0.059192657470703125, -0.042755126953125, -0.026317596435546875, -0.00988006591796875, 0.006557464599609375, 0.0229949951171875, 0.039432525634765625, 0.05587005615234375, 0.07230758666992188, 0.0887451171875, 0.10518264770507812, 0.12162017822265625, 0.13805770874023438, 0.1544952392578125, 0.17093276977539062, 0.18737030029296875, 0.20380783081054688, 0.220245361328125, 0.23668289184570312, 0.25312042236328125, 0.2695579528808594, 0.2859954833984375, 0.3024330139160156, 0.31887054443359375, 0.3353080749511719, 0.35174560546875, 0.3681831359863281, 0.38462066650390625, 0.4010581970214844, 0.4174957275390625, 0.4339332580566406, 0.45037078857421875, 0.4668083190917969, 0.483245849609375, 0.4996833801269531, 0.5161209106445312, 0.5325584411621094, 0.5489959716796875, 0.5654335021972656, 0.5818710327148438, 0.5983085632324219, 0.61474609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 25.0, 23.0, 34.0, 41.0, 61.0, 71.0, 96.0, 103.0, 99.0, 81.0, 78.0, 60.0, 69.0, 35.0, 39.0, 25.0, 15.0, 14.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17110013961792, -4.97287654876709, -4.774653434753418, -4.576429843902588, -4.378206253051758, -4.179983139038086, -3.981759548187256, -3.783536195755005, -3.585312843322754, -3.387089490890503, -3.188866138458252, -2.990642547607422, -2.792419195175171, -2.59419584274292, -2.39597225189209, -2.197748899459839, -1.999525547027588, -1.801302194595337, -1.6030787229537964, -1.4048552513122559, -1.2066318988800049, -1.008408546447754, -0.8101850748062134, -0.6119616031646729, -0.4137382507324219, -0.21551483869552612, -0.01729142665863037, 0.18093198537826538, 0.37915539741516113, 0.5773788094520569, 0.7756022214889526, 0.9738256931304932, 1.172048568725586, 1.370271921157837, 1.5684953927993774, 1.766718864440918, 1.964942216873169, 2.16316556930542, 2.36138916015625, 2.559612512588501, 2.757835865020752, 2.956059217453003, 3.154282569885254, 3.352506160736084, 3.550729513168335, 3.748952865600586, 3.947176456451416, 4.145400047302246, 4.343623161315918, 4.541846752166748, 4.74006986618042, 4.93829345703125, 5.136516571044922, 5.334740161895752, 5.532963752746582, 5.731186866760254, 5.929410457611084, 6.127634048461914, 6.325857162475586, 6.524080753326416, 6.722304344177246, 6.920527458190918, 7.118751049041748, 7.316974639892578, 7.51519775390625]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 1.0, 9.0, 5.0, 10.0, 8.0, 9.0, 20.0, 12.0, 19.0, 26.0, 25.0, 33.0, 28.0, 29.0, 33.0, 26.0, 38.0, 46.0, 38.0, 46.0, 37.0, 43.0, 44.0, 52.0, 42.0, 30.0, 31.0, 28.0, 26.0, 25.0, 25.0, 30.0, 15.0, 16.0, 16.0, 16.0, 12.0, 16.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.271702766418457, -4.145228862762451, -4.018754959106445, -3.8922808170318604, -3.7658066749572754, -3.6393327713012695, -3.5128588676452637, -3.3863847255706787, -3.2599105834960938, -3.133436679840088, -3.006962537765503, -2.880488634109497, -2.754014492034912, -2.6275405883789062, -2.5010666847229004, -2.3745925426483154, -2.2481186389923096, -2.1216447353363037, -1.9951705932617188, -1.868696689605713, -1.742222547531128, -1.615748643875122, -1.4892746210098267, -1.3628005981445312, -1.2363265752792358, -1.1098525524139404, -0.983378529548645, -0.8569045662879944, -0.730430543422699, -0.6039565205574036, -0.47748255729675293, -0.3510085344314575, -0.224534273147583, -0.09806026518344879, 0.028413742780685425, 0.15488773584365845, 0.28136175870895386, 0.40783578157424927, 0.5343097448348999, 0.6607837677001953, 0.7872577905654907, 0.9137318134307861, 1.0402058362960815, 1.166679859161377, 1.2931537628173828, 1.4196279048919678, 1.5461018085479736, 1.672575831413269, 1.7990498542785645, 1.9255238771438599, 2.0519979000091553, 2.178471803665161, 2.304945945739746, 2.431419849395752, 2.557893753051758, 2.6843678951263428, 2.8108420372009277, 2.9373159408569336, 3.0637900829315186, 3.1902639865875244, 3.3167381286621094, 3.4432120323181152, 3.569685935974121, 3.696160078048706, 3.822633981704712]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 6.0, 10.0, 7.0, 19.0, 19.0, 28.0, 30.0, 49.0, 77.0, 82.0, 156.0, 240.0, 398.0, 743.0, 1205.0, 2241.0, 4496.0, 9446.0, 21464.0, 53085.0, 149097.0, 484720.0, 1398976.0, 1364268.0, 467058.0, 144183.0, 52165.0, 21212.0, 9389.0, 4324.0, 2185.0, 1229.0, 652.0, 374.0, 236.0, 142.0, 98.0, 52.0, 36.0, 28.0, 16.0, 14.0, 8.0, 11.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.80078125, -0.7765045166015625, -0.752227783203125, -0.7279510498046875, -0.70367431640625, -0.6793975830078125, -0.655120849609375, -0.6308441162109375, -0.6065673828125, -0.5822906494140625, -0.558013916015625, -0.5337371826171875, -0.50946044921875, -0.4851837158203125, -0.460906982421875, -0.4366302490234375, -0.412353515625, -0.3880767822265625, -0.363800048828125, -0.3395233154296875, -0.31524658203125, -0.2909698486328125, -0.266693115234375, -0.2424163818359375, -0.2181396484375, -0.1938629150390625, -0.169586181640625, -0.1453094482421875, -0.12103271484375, -0.0967559814453125, -0.072479248046875, -0.0482025146484375, -0.02392578125, 0.0003509521484375, 0.024627685546875, 0.0489044189453125, 0.07318115234375, 0.0974578857421875, 0.121734619140625, 0.1460113525390625, 0.1702880859375, 0.1945648193359375, 0.218841552734375, 0.2431182861328125, 0.26739501953125, 0.2916717529296875, 0.315948486328125, 0.3402252197265625, 0.364501953125, 0.3887786865234375, 0.413055419921875, 0.4373321533203125, 0.46160888671875, 0.4858856201171875, 0.510162353515625, 0.5344390869140625, 0.5587158203125, 0.5829925537109375, 0.607269287109375, 0.6315460205078125, 0.65582275390625, 0.6800994873046875, 0.704376220703125, 0.7286529541015625, 0.7529296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 13.0, 11.0, 9.0, 6.0, 11.0, 18.0, 14.0, 28.0, 24.0, 23.0, 32.0, 36.0, 35.0, 33.0, 45.0, 42.0, 48.0, 51.0, 32.0, 34.0, 37.0, 33.0, 32.0, 41.0, 41.0, 50.0, 38.0, 30.0, 28.0, 16.0, 20.0, 17.0, 14.0, 11.0, 6.0, 9.0, 9.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5141258239746094, -0.49846649169921875, -0.4828071594238281, -0.4671478271484375, -0.4514884948730469, -0.43582916259765625, -0.4201698303222656, -0.404510498046875, -0.3888511657714844, -0.37319183349609375, -0.3575325012207031, -0.3418731689453125, -0.3262138366699219, -0.31055450439453125, -0.2948951721191406, -0.27923583984375, -0.2635765075683594, -0.24791717529296875, -0.23225784301757812, -0.2165985107421875, -0.20093917846679688, -0.18527984619140625, -0.16962051391601562, -0.153961181640625, -0.13830184936523438, -0.12264251708984375, -0.10698318481445312, -0.0913238525390625, -0.07566452026367188, -0.06000518798828125, -0.044345855712890625, -0.0286865234375, -0.013027191162109375, 0.00263214111328125, 0.018291473388671875, 0.0339508056640625, 0.049610137939453125, 0.06526947021484375, 0.08092880249023438, 0.096588134765625, 0.11224746704101562, 0.12790679931640625, 0.14356613159179688, 0.1592254638671875, 0.17488479614257812, 0.19054412841796875, 0.20620346069335938, 0.22186279296875, 0.23752212524414062, 0.25318145751953125, 0.2688407897949219, 0.2845001220703125, 0.3001594543457031, 0.31581878662109375, 0.3314781188964844, 0.347137451171875, 0.3627967834472656, 0.37845611572265625, 0.3941154479980469, 0.4097747802734375, 0.4254341125488281, 0.44109344482421875, 0.4567527770996094, 0.472412109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 9.0, 14.0, 16.0, 37.0, 40.0, 81.0, 139.0, 253.0, 573.0, 1205.0, 2704.0, 6994.0, 19700.0, 69792.0, 301988.0, 1360706.0, 1821736.0, 463378.0, 102082.0, 27342.0, 9100.0, 3500.0, 1468.0, 673.0, 327.0, 168.0, 90.0, 58.0, 44.0, 22.0, 18.0, 10.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.328277587890625, -1.28936767578125, -1.250457763671875, -1.2115478515625, -1.172637939453125, -1.13372802734375, -1.094818115234375, -1.055908203125, -1.016998291015625, -0.97808837890625, -0.939178466796875, -0.9002685546875, -0.861358642578125, -0.82244873046875, -0.783538818359375, -0.74462890625, -0.705718994140625, -0.66680908203125, -0.627899169921875, -0.5889892578125, -0.550079345703125, -0.51116943359375, -0.472259521484375, -0.433349609375, -0.394439697265625, -0.35552978515625, -0.316619873046875, -0.2777099609375, -0.238800048828125, -0.19989013671875, -0.160980224609375, -0.1220703125, -0.083160400390625, -0.04425048828125, -0.005340576171875, 0.0335693359375, 0.072479248046875, 0.11138916015625, 0.150299072265625, 0.189208984375, 0.228118896484375, 0.26702880859375, 0.305938720703125, 0.3448486328125, 0.383758544921875, 0.42266845703125, 0.461578369140625, 0.50048828125, 0.539398193359375, 0.57830810546875, 0.617218017578125, 0.6561279296875, 0.695037841796875, 0.73394775390625, 0.772857666015625, 0.811767578125, 0.850677490234375, 0.88958740234375, 0.928497314453125, 0.9674072265625, 1.006317138671875, 1.04522705078125, 1.084136962890625, 1.123046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 8.0, 6.0, 6.0, 7.0, 25.0, 30.0, 39.0, 55.0, 72.0, 106.0, 154.0, 181.0, 236.0, 341.0, 386.0, 441.0, 434.0, 397.0, 297.0, 222.0, 172.0, 147.0, 85.0, 53.0, 47.0, 38.0, 23.0, 20.0, 13.0, 9.0, 6.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8935546875, -0.8614654541015625, -0.829376220703125, -0.7972869873046875, -0.76519775390625, -0.7331085205078125, -0.701019287109375, -0.6689300537109375, -0.6368408203125, -0.6047515869140625, -0.572662353515625, -0.5405731201171875, -0.50848388671875, -0.4763946533203125, -0.444305419921875, -0.4122161865234375, -0.380126953125, -0.3480377197265625, -0.315948486328125, -0.2838592529296875, -0.25177001953125, -0.2196807861328125, -0.187591552734375, -0.1555023193359375, -0.1234130859375, -0.0913238525390625, -0.059234619140625, -0.0271453857421875, 0.00494384765625, 0.0370330810546875, 0.069122314453125, 0.1012115478515625, 0.13330078125, 0.1653900146484375, 0.197479248046875, 0.2295684814453125, 0.26165771484375, 0.2937469482421875, 0.325836181640625, 0.3579254150390625, 0.3900146484375, 0.4221038818359375, 0.454193115234375, 0.4862823486328125, 0.51837158203125, 0.5504608154296875, 0.582550048828125, 0.6146392822265625, 0.646728515625, 0.6788177490234375, 0.710906982421875, 0.7429962158203125, 0.77508544921875, 0.8071746826171875, 0.839263916015625, 0.8713531494140625, 0.9034423828125, 0.9355316162109375, 0.967620849609375, 0.9997100830078125, 1.03179931640625, 1.0638885498046875, 1.095977783203125, 1.1280670166015625, 1.16015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 17.0, 21.0, 45.0, 61.0, 92.0, 134.0, 149.0, 125.0, 122.0, 93.0, 68.0, 29.0, 16.0, 14.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.489984512329102, -10.234557151794434, -9.979129791259766, -9.723702430725098, -9.46827507019043, -9.212847709655762, -8.957420349121094, -8.701992988586426, -8.446565628051758, -8.19113826751709, -7.935710906982422, -7.680283546447754, -7.424856185913086, -7.169428825378418, -6.91400146484375, -6.658574104309082, -6.403146743774414, -6.147719383239746, -5.892292022705078, -5.63686466217041, -5.381437301635742, -5.126009941101074, -4.870582580566406, -4.615155220031738, -4.35972785949707, -4.104300498962402, -3.8488731384277344, -3.5934457778930664, -3.3380184173583984, -3.0825910568237305, -2.8271636962890625, -2.5717363357543945, -2.3163089752197266, -2.0608816146850586, -1.8054542541503906, -1.5500268936157227, -1.2945995330810547, -1.0391721725463867, -0.7837448120117188, -0.5283174514770508, -0.2728900909423828, -0.017462730407714844, 0.23796463012695312, 0.4933919906616211, 0.7488193511962891, 1.004246711730957, 1.259674072265625, 1.515101432800293, 1.770528793334961, 2.025956153869629, 2.281383514404297, 2.536810874938965, 2.792238235473633, 3.047665596008301, 3.3030929565429688, 3.5585203170776367, 3.8139476776123047, 4.069375038146973, 4.324802398681641, 4.580229759216309, 4.835657119750977, 5.0910844802856445, 5.3465118408203125, 5.6019392013549805, 5.857366561889648]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 6.0, 10.0, 10.0, 11.0, 10.0, 14.0, 19.0, 20.0, 29.0, 17.0, 27.0, 35.0, 33.0, 42.0, 40.0, 44.0, 36.0, 28.0, 39.0, 42.0, 44.0, 44.0, 42.0, 33.0, 32.0, 31.0, 27.0, 32.0, 22.0, 25.0, 22.0, 20.0, 15.0, 15.0, 12.0, 14.0, 7.0, 17.0, 1.0, 6.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8077805042266846, -2.7121710777282715, -2.6165616512298584, -2.5209522247314453, -2.4253427982330322, -2.329733371734619, -2.234124183654785, -2.138514518737793, -2.042905330657959, -1.947295904159546, -1.8516864776611328, -1.7560770511627197, -1.6604676246643066, -1.5648581981658936, -1.46924889087677, -1.373639464378357, -1.2780299186706543, -1.1824204921722412, -1.0868110656738281, -0.9912016987800598, -0.8955922722816467, -0.7999828457832336, -0.7043734788894653, -0.6087640523910522, -0.5131546258926392, -0.4175451993942261, -0.3219358026981354, -0.22632640600204468, -0.1307169795036316, -0.035107553005218506, 0.060501813888549805, 0.1561112403869629, 0.2517204284667969, 0.34732985496520996, 0.44293925166130066, 0.5385486483573914, 0.6341580748558044, 0.7297675013542175, 0.8253768682479858, 0.9209862947463989, 1.016595721244812, 1.112205147743225, 1.2078145742416382, 1.3034238815307617, 1.3990333080291748, 1.494642734527588, 1.590252161026001, 1.685861587524414, 1.7814710140228271, 1.8770804405212402, 1.9726898670196533, 2.0682992935180664, 2.1639087200164795, 2.2595181465148926, 2.3551273345947266, 2.4507369995117188, 2.5463461875915527, 2.641955614089966, 2.737565040588379, 2.833174467086792, 2.928783893585205, 3.024393320083618, 3.1200027465820312, 3.2156119346618652, 3.3112215995788574]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 10.0, 11.0, 18.0, 23.0, 33.0, 42.0, 91.0, 141.0, 208.0, 346.0, 608.0, 1115.0, 2034.0, 3746.0, 7032.0, 13489.0, 25649.0, 51137.0, 113790.0, 236496.0, 283107.0, 163006.0, 72681.0, 35076.0, 18059.0, 9497.0, 4996.0, 2727.0, 1447.0, 791.0, 417.0, 278.0, 158.0, 85.0, 62.0, 38.0, 24.0, 23.0, 15.0, 14.0, 5.0, 8.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.5458984375, -1.500732421875, -1.45556640625, -1.410400390625, -1.365234375, -1.320068359375, -1.27490234375, -1.229736328125, -1.1845703125, -1.139404296875, -1.09423828125, -1.049072265625, -1.00390625, -0.958740234375, -0.91357421875, -0.868408203125, -0.8232421875, -0.778076171875, -0.73291015625, -0.687744140625, -0.642578125, -0.597412109375, -0.55224609375, -0.507080078125, -0.4619140625, -0.416748046875, -0.37158203125, -0.326416015625, -0.28125, -0.236083984375, -0.19091796875, -0.145751953125, -0.1005859375, -0.055419921875, -0.01025390625, 0.034912109375, 0.080078125, 0.125244140625, 0.17041015625, 0.215576171875, 0.2607421875, 0.305908203125, 0.35107421875, 0.396240234375, 0.44140625, 0.486572265625, 0.53173828125, 0.576904296875, 0.6220703125, 0.667236328125, 0.71240234375, 0.757568359375, 0.802734375, 0.847900390625, 0.89306640625, 0.938232421875, 0.9833984375, 1.028564453125, 1.07373046875, 1.118896484375, 1.1640625, 1.209228515625, 1.25439453125, 1.299560546875, 1.3447265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 4.0, 6.0, 9.0, 8.0, 18.0, 20.0, 18.0, 21.0, 28.0, 35.0, 34.0, 40.0, 34.0, 37.0, 43.0, 42.0, 48.0, 46.0, 51.0, 52.0, 47.0, 56.0, 41.0, 45.0, 32.0, 30.0, 24.0, 17.0, 25.0, 17.0, 13.0, 14.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.58349609375, -0.5666732788085938, -0.5498504638671875, -0.5330276489257812, -0.516204833984375, -0.49938201904296875, -0.4825592041015625, -0.46573638916015625, -0.44891357421875, -0.43209075927734375, -0.4152679443359375, -0.39844512939453125, -0.381622314453125, -0.36479949951171875, -0.3479766845703125, -0.33115386962890625, -0.3143310546875, -0.29750823974609375, -0.2806854248046875, -0.26386260986328125, -0.247039794921875, -0.23021697998046875, -0.2133941650390625, -0.19657135009765625, -0.17974853515625, -0.16292572021484375, -0.1461029052734375, -0.12928009033203125, -0.112457275390625, -0.09563446044921875, -0.0788116455078125, -0.06198883056640625, -0.045166015625, -0.02834320068359375, -0.0115203857421875, 0.00530242919921875, 0.022125244140625, 0.03894805908203125, 0.0557708740234375, 0.07259368896484375, 0.08941650390625, 0.10623931884765625, 0.1230621337890625, 0.13988494873046875, 0.156707763671875, 0.17353057861328125, 0.1903533935546875, 0.20717620849609375, 0.2239990234375, 0.24082183837890625, 0.2576446533203125, 0.27446746826171875, 0.291290283203125, 0.30811309814453125, 0.3249359130859375, 0.34175872802734375, 0.35858154296875, 0.37540435791015625, 0.3922271728515625, 0.40904998779296875, 0.425872802734375, 0.44269561767578125, 0.4595184326171875, 0.47634124755859375, 0.4931640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 16.0, 20.0, 15.0, 20.0, 32.0, 43.0, 58.0, 78.0, 117.0, 196.0, 305.0, 638.0, 1374.0, 3460.0, 8837.0, 23181.0, 61522.0, 172430.0, 367349.0, 259109.0, 93295.0, 34109.0, 13321.0, 5068.0, 1993.0, 863.0, 457.0, 221.0, 115.0, 93.0, 62.0, 39.0, 40.0, 19.0, 17.0, 16.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.861328125, -1.8061065673828125, -1.750885009765625, -1.6956634521484375, -1.64044189453125, -1.5852203369140625, -1.529998779296875, -1.4747772216796875, -1.4195556640625, -1.3643341064453125, -1.309112548828125, -1.2538909912109375, -1.19866943359375, -1.1434478759765625, -1.088226318359375, -1.0330047607421875, -0.977783203125, -0.9225616455078125, -0.867340087890625, -0.8121185302734375, -0.75689697265625, -0.7016754150390625, -0.646453857421875, -0.5912322998046875, -0.5360107421875, -0.4807891845703125, -0.425567626953125, -0.3703460693359375, -0.31512451171875, -0.2599029541015625, -0.204681396484375, -0.1494598388671875, -0.09423828125, -0.0390167236328125, 0.016204833984375, 0.0714263916015625, 0.12664794921875, 0.1818695068359375, 0.237091064453125, 0.2923126220703125, 0.3475341796875, 0.4027557373046875, 0.457977294921875, 0.5131988525390625, 0.56842041015625, 0.6236419677734375, 0.678863525390625, 0.7340850830078125, 0.789306640625, 0.8445281982421875, 0.899749755859375, 0.9549713134765625, 1.01019287109375, 1.0654144287109375, 1.120635986328125, 1.1758575439453125, 1.2310791015625, 1.2863006591796875, 1.341522216796875, 1.3967437744140625, 1.45196533203125, 1.5071868896484375, 1.562408447265625, 1.6176300048828125, 1.6728515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 13.0, 13.0, 11.0, 10.0, 15.0, 13.0, 20.0, 26.0, 19.0, 32.0, 29.0, 34.0, 37.0, 41.0, 49.0, 30.0, 34.0, 47.0, 32.0, 42.0, 34.0, 36.0, 28.0, 31.0, 32.0, 30.0, 27.0, 23.0, 16.0, 30.0, 17.0, 14.0, 18.0, 22.0, 21.0, 10.0, 10.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2412109375, -1.201324462890625, -1.16143798828125, -1.121551513671875, -1.0816650390625, -1.041778564453125, -1.00189208984375, -0.962005615234375, -0.922119140625, -0.882232666015625, -0.84234619140625, -0.802459716796875, -0.7625732421875, -0.722686767578125, -0.68280029296875, -0.642913818359375, -0.60302734375, -0.563140869140625, -0.52325439453125, -0.483367919921875, -0.4434814453125, -0.403594970703125, -0.36370849609375, -0.323822021484375, -0.283935546875, -0.244049072265625, -0.20416259765625, -0.164276123046875, -0.1243896484375, -0.084503173828125, -0.04461669921875, -0.004730224609375, 0.03515625, 0.075042724609375, 0.11492919921875, 0.154815673828125, 0.1947021484375, 0.234588623046875, 0.27447509765625, 0.314361572265625, 0.354248046875, 0.394134521484375, 0.43402099609375, 0.473907470703125, 0.5137939453125, 0.553680419921875, 0.59356689453125, 0.633453369140625, 0.67333984375, 0.713226318359375, 0.75311279296875, 0.792999267578125, 0.8328857421875, 0.872772216796875, 0.91265869140625, 0.952545166015625, 0.992431640625, 1.032318115234375, 1.07220458984375, 1.112091064453125, 1.1519775390625, 1.191864013671875, 1.23175048828125, 1.271636962890625, 1.3115234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 12.0, 20.0, 26.0, 54.0, 91.0, 144.0, 234.0, 324.0, 652.0, 1144.0, 2059.0, 3763.0, 6780.0, 12031.0, 20953.0, 37554.0, 68929.0, 123811.0, 194560.0, 215353.0, 156962.0, 90643.0, 49561.0, 27591.0, 15379.0, 8675.0, 4885.0, 2629.0, 1579.0, 916.0, 477.0, 305.0, 174.0, 94.0, 70.0, 30.0, 30.0, 15.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.576171875, -0.5602684020996094, -0.5443649291992188, -0.5284614562988281, -0.5125579833984375, -0.4966545104980469, -0.48075103759765625, -0.4648475646972656, -0.448944091796875, -0.4330406188964844, -0.41713714599609375, -0.4012336730957031, -0.3853302001953125, -0.3694267272949219, -0.35352325439453125, -0.3376197814941406, -0.32171630859375, -0.3058128356933594, -0.28990936279296875, -0.2740058898925781, -0.2581024169921875, -0.24219894409179688, -0.22629547119140625, -0.21039199829101562, -0.194488525390625, -0.17858505249023438, -0.16268157958984375, -0.14677810668945312, -0.1308746337890625, -0.11497116088867188, -0.09906768798828125, -0.08316421508789062, -0.0672607421875, -0.051357269287109375, -0.03545379638671875, -0.019550323486328125, -0.0036468505859375, 0.012256622314453125, 0.02816009521484375, 0.044063568115234375, 0.059967041015625, 0.07587051391601562, 0.09177398681640625, 0.10767745971679688, 0.1235809326171875, 0.13948440551757812, 0.15538787841796875, 0.17129135131835938, 0.18719482421875, 0.20309829711914062, 0.21900177001953125, 0.23490524291992188, 0.2508087158203125, 0.2667121887207031, 0.28261566162109375, 0.2985191345214844, 0.314422607421875, 0.3303260803222656, 0.34622955322265625, 0.3621330261230469, 0.3780364990234375, 0.3939399719238281, 0.40984344482421875, 0.4257469177246094, 0.441650390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 13.0, 13.0, 22.0, 24.0, 23.0, 51.0, 58.0, 66.0, 94.0, 118.0, 107.0, 97.0, 71.0, 49.0, 50.0, 29.0, 23.0, 13.0, 13.0, 9.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020575523376464844, -0.00020033493638038635, -0.00019491463899612427, -0.00018949434161186218, -0.0001840740442276001, -0.000178653746843338, -0.00017323344945907593, -0.00016781315207481384, -0.00016239285469055176, -0.00015697255730628967, -0.0001515522599220276, -0.0001461319625377655, -0.00014071166515350342, -0.00013529136776924133, -0.00012987107038497925, -0.00012445077300071716, -0.00011903047561645508, -0.00011361017823219299, -0.00010818988084793091, -0.00010276958346366882, -9.734928607940674e-05, -9.192898869514465e-05, -8.650869131088257e-05, -8.108839392662048e-05, -7.56680965423584e-05, -7.024779915809631e-05, -6.482750177383423e-05, -5.9407204389572144e-05, -5.398690700531006e-05, -4.8566609621047974e-05, -4.314631223678589e-05, -3.7726014852523804e-05, -3.230571746826172e-05, -2.6885420083999634e-05, -2.146512269973755e-05, -1.6044825315475464e-05, -1.0624527931213379e-05, -5.204230546951294e-06, 2.1606683731079102e-07, 5.636364221572876e-06, 1.1056661605834961e-05, 1.6476958990097046e-05, 2.189725637435913e-05, 2.7317553758621216e-05, 3.27378511428833e-05, 3.8158148527145386e-05, 4.357844591140747e-05, 4.8998743295669556e-05, 5.441904067993164e-05, 5.9839338064193726e-05, 6.525963544845581e-05, 7.06799328327179e-05, 7.610023021697998e-05, 8.152052760124207e-05, 8.694082498550415e-05, 9.236112236976624e-05, 9.778141975402832e-05, 0.0001032017171382904, 0.00010862201452255249, 0.00011404231190681458, 0.00011946260929107666, 0.00012488290667533875, 0.00013030320405960083, 0.00013572350144386292, 0.000141143798828125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 2.0, 7.0, 15.0, 14.0, 28.0, 35.0, 56.0, 87.0, 132.0, 225.0, 352.0, 604.0, 1182.0, 2200.0, 4424.0, 8847.0, 17532.0, 35444.0, 73051.0, 160325.0, 280863.0, 238636.0, 116816.0, 54140.0, 26704.0, 13201.0, 6550.0, 3390.0, 1604.0, 873.0, 478.0, 274.0, 165.0, 107.0, 78.0, 37.0, 25.0, 15.0, 15.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5432891845703125, -0.525054931640625, -0.5068206787109375, -0.48858642578125, -0.4703521728515625, -0.452117919921875, -0.4338836669921875, -0.4156494140625, -0.3974151611328125, -0.379180908203125, -0.3609466552734375, -0.34271240234375, -0.3244781494140625, -0.306243896484375, -0.2880096435546875, -0.269775390625, -0.2515411376953125, -0.233306884765625, -0.2150726318359375, -0.19683837890625, -0.1786041259765625, -0.160369873046875, -0.1421356201171875, -0.1239013671875, -0.1056671142578125, -0.087432861328125, -0.0691986083984375, -0.05096435546875, -0.0327301025390625, -0.014495849609375, 0.0037384033203125, 0.02197265625, 0.0402069091796875, 0.058441162109375, 0.0766754150390625, 0.09490966796875, 0.1131439208984375, 0.131378173828125, 0.1496124267578125, 0.1678466796875, 0.1860809326171875, 0.204315185546875, 0.2225494384765625, 0.24078369140625, 0.2590179443359375, 0.277252197265625, 0.2954864501953125, 0.313720703125, 0.3319549560546875, 0.350189208984375, 0.3684234619140625, 0.38665771484375, 0.4048919677734375, 0.423126220703125, 0.4413604736328125, 0.4595947265625, 0.4778289794921875, 0.496063232421875, 0.5142974853515625, 0.53253173828125, 0.5507659912109375, 0.569000244140625, 0.5872344970703125, 0.60546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 5.0, 11.0, 17.0, 21.0, 26.0, 28.0, 32.0, 47.0, 38.0, 53.0, 80.0, 65.0, 71.0, 77.0, 81.0, 42.0, 59.0, 43.0, 36.0, 37.0, 26.0, 17.0, 19.0, 12.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.61083984375, -0.5916900634765625, -0.572540283203125, -0.5533905029296875, -0.53424072265625, -0.5150909423828125, -0.495941162109375, -0.4767913818359375, -0.4576416015625, -0.4384918212890625, -0.419342041015625, -0.4001922607421875, -0.38104248046875, -0.3618927001953125, -0.342742919921875, -0.3235931396484375, -0.304443359375, -0.2852935791015625, -0.266143798828125, -0.2469940185546875, -0.22784423828125, -0.2086944580078125, -0.189544677734375, -0.1703948974609375, -0.1512451171875, -0.1320953369140625, -0.112945556640625, -0.0937957763671875, -0.07464599609375, -0.0554962158203125, -0.036346435546875, -0.0171966552734375, 0.001953125, 0.0211029052734375, 0.040252685546875, 0.0594024658203125, 0.07855224609375, 0.0977020263671875, 0.116851806640625, 0.1360015869140625, 0.1551513671875, 0.1743011474609375, 0.193450927734375, 0.2126007080078125, 0.23175048828125, 0.2509002685546875, 0.270050048828125, 0.2891998291015625, 0.308349609375, 0.3274993896484375, 0.346649169921875, 0.3657989501953125, 0.38494873046875, 0.4040985107421875, 0.423248291015625, 0.4423980712890625, 0.4615478515625, 0.4806976318359375, 0.499847412109375, 0.5189971923828125, 0.53814697265625, 0.5572967529296875, 0.576446533203125, 0.5955963134765625, 0.61474609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 10.0, 22.0, 39.0, 58.0, 87.0, 102.0, 137.0, 104.0, 131.0, 100.0, 66.0, 53.0, 41.0, 23.0, 15.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.263677597045898, -10.009865760803223, -9.756053924560547, -9.502243041992188, -9.248431205749512, -8.994619369506836, -8.740808486938477, -8.4869966506958, -8.233184814453125, -7.979372978210449, -7.725561618804932, -7.471750259399414, -7.217938423156738, -6.9641265869140625, -6.710315227508545, -6.456503868103027, -6.202692031860352, -5.948880195617676, -5.695068836212158, -5.441257476806641, -5.187445640563965, -4.933633804321289, -4.6798224449157715, -4.426011085510254, -4.172199249267578, -3.9183876514434814, -3.6645760536193848, -3.410764455795288, -3.1569528579711914, -2.9031412601470947, -2.649329662322998, -2.3955180644989014, -2.1417064666748047, -1.887894868850708, -1.6340832710266113, -1.3802716732025146, -1.126460075378418, -0.8726484775543213, -0.6188368797302246, -0.36502528190612793, -0.11121368408203125, 0.14259791374206543, 0.3964095115661621, 0.6502211093902588, 0.9040327072143555, 1.1578443050384521, 1.4116559028625488, 1.6654675006866455, 1.9192790985107422, 2.173090696334839, 2.4269022941589355, 2.6807138919830322, 2.934525489807129, 3.1883370876312256, 3.4421486854553223, 3.695960283279419, 3.9497718811035156, 4.203583717346191, 4.457395076751709, 4.711206436157227, 4.965018272399902, 5.218830108642578, 5.472641468048096, 5.726452827453613, 5.980264663696289]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 9.0, 11.0, 15.0, 16.0, 12.0, 16.0, 17.0, 34.0, 31.0, 35.0, 26.0, 36.0, 40.0, 40.0, 45.0, 47.0, 52.0, 37.0, 40.0, 47.0, 33.0, 51.0, 36.0, 35.0, 45.0, 24.0, 29.0, 18.0, 21.0, 13.0, 17.0, 10.0, 14.0, 10.0, 5.0, 10.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.538846969604492, -4.402700424194336, -4.26655387878418, -4.130407333374023, -3.994260787963867, -3.858114242553711, -3.7219676971435547, -3.5858211517333984, -3.449674606323242, -3.313528060913086, -3.1773815155029297, -3.0412349700927734, -2.905088424682617, -2.768941879272461, -2.6327953338623047, -2.4966487884521484, -2.360502243041992, -2.224355697631836, -2.0882091522216797, -1.9520626068115234, -1.8159160614013672, -1.679769515991211, -1.5436229705810547, -1.4074764251708984, -1.2713298797607422, -1.135183334350586, -0.9990367889404297, -0.8628902435302734, -0.7267436981201172, -0.5905971527099609, -0.4544506072998047, -0.31830406188964844, -0.1821575164794922, -0.04601097106933594, 0.09013557434082031, 0.22628211975097656, 0.3624286651611328, 0.49857521057128906, 0.6347217559814453, 0.7708683013916016, 0.9070148468017578, 1.043161392211914, 1.1793079376220703, 1.3154544830322266, 1.4516010284423828, 1.587747573852539, 1.7238941192626953, 1.8600406646728516, 1.9961872100830078, 2.132333755493164, 2.2684803009033203, 2.4046268463134766, 2.540773391723633, 2.676919937133789, 2.8130664825439453, 2.9492130279541016, 3.085359573364258, 3.221506118774414, 3.3576526641845703, 3.4937992095947266, 3.629945755004883, 3.766092300415039, 3.9022388458251953, 4.038385391235352, 4.174531936645508]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 5.0, 11.0, 17.0, 31.0, 45.0, 83.0, 142.0, 284.0, 556.0, 1168.0, 2569.0, 6169.0, 17306.0, 56259.0, 227913.0, 1117047.0, 2029512.0, 561854.0, 120993.0, 33421.0, 11226.0, 4366.0, 1764.0, 747.0, 385.0, 191.0, 110.0, 41.0, 21.0, 22.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.195526123046875, -1.15960693359375, -1.123687744140625, -1.0877685546875, -1.051849365234375, -1.01593017578125, -0.980010986328125, -0.944091796875, -0.908172607421875, -0.87225341796875, -0.836334228515625, -0.8004150390625, -0.764495849609375, -0.72857666015625, -0.692657470703125, -0.65673828125, -0.620819091796875, -0.58489990234375, -0.548980712890625, -0.5130615234375, -0.477142333984375, -0.44122314453125, -0.405303955078125, -0.369384765625, -0.333465576171875, -0.29754638671875, -0.261627197265625, -0.2257080078125, -0.189788818359375, -0.15386962890625, -0.117950439453125, -0.08203125, -0.046112060546875, -0.01019287109375, 0.025726318359375, 0.0616455078125, 0.097564697265625, 0.13348388671875, 0.169403076171875, 0.205322265625, 0.241241455078125, 0.27716064453125, 0.313079833984375, 0.3489990234375, 0.384918212890625, 0.42083740234375, 0.456756591796875, 0.49267578125, 0.528594970703125, 0.56451416015625, 0.600433349609375, 0.6363525390625, 0.672271728515625, 0.70819091796875, 0.744110107421875, 0.780029296875, 0.815948486328125, 0.85186767578125, 0.887786865234375, 0.9237060546875, 0.959625244140625, 0.99554443359375, 1.031463623046875, 1.0673828125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 9.0, 7.0, 15.0, 18.0, 17.0, 24.0, 32.0, 43.0, 43.0, 32.0, 37.0, 55.0, 49.0, 64.0, 48.0, 60.0, 63.0, 45.0, 49.0, 57.0, 46.0, 33.0, 30.0, 22.0, 16.0, 20.0, 8.0, 18.0, 9.0, 9.0, 10.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7373046875, -0.7155303955078125, -0.693756103515625, -0.6719818115234375, -0.65020751953125, -0.6284332275390625, -0.606658935546875, -0.5848846435546875, -0.5631103515625, -0.5413360595703125, -0.519561767578125, -0.4977874755859375, -0.47601318359375, -0.4542388916015625, -0.432464599609375, -0.4106903076171875, -0.388916015625, -0.3671417236328125, -0.345367431640625, -0.3235931396484375, -0.30181884765625, -0.2800445556640625, -0.258270263671875, -0.2364959716796875, -0.2147216796875, -0.1929473876953125, -0.171173095703125, -0.1493988037109375, -0.12762451171875, -0.1058502197265625, -0.084075927734375, -0.0623016357421875, -0.04052734375, -0.0187530517578125, 0.003021240234375, 0.0247955322265625, 0.04656982421875, 0.0683441162109375, 0.090118408203125, 0.1118927001953125, 0.1336669921875, 0.1554412841796875, 0.177215576171875, 0.1989898681640625, 0.22076416015625, 0.2425384521484375, 0.264312744140625, 0.2860870361328125, 0.307861328125, 0.3296356201171875, 0.351409912109375, 0.3731842041015625, 0.39495849609375, 0.4167327880859375, 0.438507080078125, 0.4602813720703125, 0.4820556640625, 0.5038299560546875, 0.525604248046875, 0.5473785400390625, 0.56915283203125, 0.5909271240234375, 0.612701416015625, 0.6344757080078125, 0.65625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 13.0, 20.0, 29.0, 47.0, 75.0, 120.0, 177.0, 393.0, 665.0, 1332.0, 3130.0, 7939.0, 25500.0, 105094.0, 561318.0, 2164897.0, 1064791.0, 196278.0, 42061.0, 12177.0, 4377.0, 1919.0, 858.0, 413.0, 276.0, 168.0, 80.0, 52.0, 34.0, 20.0, 6.0, 11.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9208984375, -1.86993408203125, -1.8189697265625, -1.76800537109375, -1.717041015625, -1.66607666015625, -1.6151123046875, -1.56414794921875, -1.51318359375, -1.46221923828125, -1.4112548828125, -1.36029052734375, -1.309326171875, -1.25836181640625, -1.2073974609375, -1.15643310546875, -1.10546875, -1.05450439453125, -1.0035400390625, -0.95257568359375, -0.901611328125, -0.85064697265625, -0.7996826171875, -0.74871826171875, -0.69775390625, -0.64678955078125, -0.5958251953125, -0.54486083984375, -0.493896484375, -0.44293212890625, -0.3919677734375, -0.34100341796875, -0.2900390625, -0.23907470703125, -0.1881103515625, -0.13714599609375, -0.086181640625, -0.03521728515625, 0.0157470703125, 0.06671142578125, 0.11767578125, 0.16864013671875, 0.2196044921875, 0.27056884765625, 0.321533203125, 0.37249755859375, 0.4234619140625, 0.47442626953125, 0.525390625, 0.57635498046875, 0.6273193359375, 0.67828369140625, 0.729248046875, 0.78021240234375, 0.8311767578125, 0.88214111328125, 0.93310546875, 0.98406982421875, 1.0350341796875, 1.08599853515625, 1.136962890625, 1.18792724609375, 1.2388916015625, 1.28985595703125, 1.3408203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 10.0, 20.0, 34.0, 28.0, 55.0, 87.0, 127.0, 183.0, 272.0, 371.0, 480.0, 518.0, 481.0, 392.0, 289.0, 215.0, 172.0, 98.0, 78.0, 50.0, 27.0, 21.0, 16.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.35546875, -1.3114013671875, -1.267333984375, -1.2232666015625, -1.17919921875, -1.1351318359375, -1.091064453125, -1.0469970703125, -1.0029296875, -0.9588623046875, -0.914794921875, -0.8707275390625, -0.82666015625, -0.7825927734375, -0.738525390625, -0.6944580078125, -0.650390625, -0.6063232421875, -0.562255859375, -0.5181884765625, -0.47412109375, -0.4300537109375, -0.385986328125, -0.3419189453125, -0.2978515625, -0.2537841796875, -0.209716796875, -0.1656494140625, -0.12158203125, -0.0775146484375, -0.033447265625, 0.0106201171875, 0.0546875, 0.0987548828125, 0.142822265625, 0.1868896484375, 0.23095703125, 0.2750244140625, 0.319091796875, 0.3631591796875, 0.4072265625, 0.4512939453125, 0.495361328125, 0.5394287109375, 0.58349609375, 0.6275634765625, 0.671630859375, 0.7156982421875, 0.759765625, 0.8038330078125, 0.847900390625, 0.8919677734375, 0.93603515625, 0.9801025390625, 1.024169921875, 1.0682373046875, 1.1123046875, 1.1563720703125, 1.200439453125, 1.2445068359375, 1.28857421875, 1.3326416015625, 1.376708984375, 1.4207763671875, 1.46484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 11.0, 13.0, 12.0, 31.0, 37.0, 57.0, 67.0, 77.0, 81.0, 86.0, 99.0, 63.0, 78.0, 76.0, 60.0, 50.0, 33.0, 21.0, 9.0, 12.0, 9.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0], "bins": [-9.641374588012695, -9.441437721252441, -9.241500854492188, -9.041563987731934, -8.84162712097168, -8.641690254211426, -8.441753387451172, -8.241816520690918, -8.041879653930664, -7.84194278717041, -7.642005920410156, -7.442069053649902, -7.242132186889648, -7.0421953201293945, -6.842258453369141, -6.642321586608887, -6.442384243011475, -6.242447376251221, -6.042510509490967, -5.842573642730713, -5.642636775970459, -5.442699909210205, -5.242762565612793, -5.042825698852539, -4.842888832092285, -4.642951965332031, -4.443015098571777, -4.243078231811523, -4.0431413650512695, -3.8432044982910156, -3.6432673931121826, -3.4433305263519287, -3.2433934211730957, -3.043456554412842, -2.843519687652588, -2.643582820892334, -2.44364595413208, -2.243709087371826, -2.043771982192993, -1.8438351154327393, -1.6438982486724854, -1.4439613819122314, -1.2440245151519775, -1.044087529182434, -0.8441506624221802, -0.6442137956619263, -0.4442768096923828, -0.2443399429321289, -0.044403076171875, 0.1555338203907013, 0.3554707169532776, 0.5554076433181763, 0.7553445100784302, 0.9552813768386841, 1.1552183628082275, 1.3551552295684814, 1.5550920963287354, 1.7550289630889893, 1.9549658298492432, 2.154902935028076, 2.35483980178833, 2.554776668548584, 2.754713535308838, 2.954650402069092, 3.1545872688293457]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 17.0, 6.0, 10.0, 16.0, 16.0, 15.0, 23.0, 19.0, 20.0, 24.0, 24.0, 24.0, 43.0, 41.0, 47.0, 32.0, 39.0, 36.0, 49.0, 40.0, 44.0, 41.0, 40.0, 37.0, 27.0, 40.0, 25.0, 21.0, 26.0, 25.0, 9.0, 19.0, 18.0, 19.0, 15.0, 9.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078807830810547, -3.948406219482422, -3.818004846572876, -3.687603235244751, -3.557201862335205, -3.42680025100708, -3.296398639678955, -3.165997266769409, -3.0355958938598633, -2.9051942825317383, -2.7747929096221924, -2.6443912982940674, -2.5139899253845215, -2.3835883140563965, -2.2531867027282715, -2.1227853298187256, -1.9923837184906006, -1.8619822263717651, -1.7315807342529297, -1.6011791229248047, -1.4707777500152588, -1.3403761386871338, -1.2099746465682983, -1.079573154449463, -0.9491716623306274, -0.818770170211792, -0.6883686780929565, -0.5579671263694763, -0.42756563425064087, -0.2971641421318054, -0.1667625904083252, -0.036361098289489746, 0.0940403938293457, 0.22444190084934235, 0.354843407869339, 0.4852449297904968, 0.6156464219093323, 0.7460479140281677, 0.876449465751648, 1.0068509578704834, 1.1372524499893188, 1.2676539421081543, 1.3980554342269897, 1.5284569263458252, 1.6588585376739502, 1.789259910583496, 1.919661521911621, 2.050063133239746, 2.180464506149292, 2.310866117477417, 2.441267490386963, 2.571669101715088, 2.702070474624634, 2.832472085952759, 2.9628734588623047, 3.0932750701904297, 3.2236766815185547, 3.3540782928466797, 3.4844796657562256, 3.6148812770843506, 3.7452826499938965, 3.8756842613220215, 4.0060858726501465, 4.136487007141113, 4.266888618469238]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 25.0, 19.0, 39.0, 48.0, 66.0, 150.0, 255.0, 456.0, 708.0, 1421.0, 2677.0, 5227.0, 10159.0, 19055.0, 36468.0, 73039.0, 145273.0, 245780.0, 235437.0, 134180.0, 67015.0, 34065.0, 17529.0, 9078.0, 4741.0, 2541.0, 1342.0, 736.0, 385.0, 232.0, 147.0, 92.0, 51.0, 33.0, 18.0, 20.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3142852783203125, -1.267242431640625, -1.2201995849609375, -1.17315673828125, -1.1261138916015625, -1.079071044921875, -1.0320281982421875, -0.9849853515625, -0.9379425048828125, -0.890899658203125, -0.8438568115234375, -0.79681396484375, -0.7497711181640625, -0.702728271484375, -0.6556854248046875, -0.608642578125, -0.5615997314453125, -0.514556884765625, -0.4675140380859375, -0.42047119140625, -0.3734283447265625, -0.326385498046875, -0.2793426513671875, -0.2322998046875, -0.1852569580078125, -0.138214111328125, -0.0911712646484375, -0.04412841796875, 0.0029144287109375, 0.049957275390625, 0.0970001220703125, 0.14404296875, 0.1910858154296875, 0.238128662109375, 0.2851715087890625, 0.33221435546875, 0.3792572021484375, 0.426300048828125, 0.4733428955078125, 0.5203857421875, 0.5674285888671875, 0.614471435546875, 0.6615142822265625, 0.70855712890625, 0.7555999755859375, 0.802642822265625, 0.8496856689453125, 0.896728515625, 0.9437713623046875, 0.990814208984375, 1.0378570556640625, 1.08489990234375, 1.1319427490234375, 1.178985595703125, 1.2260284423828125, 1.2730712890625, 1.3201141357421875, 1.367156982421875, 1.4141998291015625, 1.46124267578125, 1.5082855224609375, 1.555328369140625, 1.6023712158203125, 1.6494140625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 9.0, 23.0, 20.0, 21.0, 16.0, 25.0, 37.0, 35.0, 42.0, 49.0, 46.0, 36.0, 47.0, 48.0, 55.0, 62.0, 42.0, 55.0, 42.0, 34.0, 45.0, 29.0, 31.0, 24.0, 19.0, 18.0, 14.0, 10.0, 8.0, 7.0, 5.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7431640625, -0.722015380859375, -0.70086669921875, -0.679718017578125, -0.6585693359375, -0.637420654296875, -0.61627197265625, -0.595123291015625, -0.573974609375, -0.552825927734375, -0.53167724609375, -0.510528564453125, -0.4893798828125, -0.468231201171875, -0.44708251953125, -0.425933837890625, -0.40478515625, -0.383636474609375, -0.36248779296875, -0.341339111328125, -0.3201904296875, -0.299041748046875, -0.27789306640625, -0.256744384765625, -0.235595703125, -0.214447021484375, -0.19329833984375, -0.172149658203125, -0.1510009765625, -0.129852294921875, -0.10870361328125, -0.087554931640625, -0.06640625, -0.045257568359375, -0.02410888671875, -0.002960205078125, 0.0181884765625, 0.039337158203125, 0.06048583984375, 0.081634521484375, 0.102783203125, 0.123931884765625, 0.14508056640625, 0.166229248046875, 0.1873779296875, 0.208526611328125, 0.22967529296875, 0.250823974609375, 0.27197265625, 0.293121337890625, 0.31427001953125, 0.335418701171875, 0.3565673828125, 0.377716064453125, 0.39886474609375, 0.420013427734375, 0.441162109375, 0.462310791015625, 0.48345947265625, 0.504608154296875, 0.5257568359375, 0.546905517578125, 0.56805419921875, 0.589202880859375, 0.6103515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 9.0, 19.0, 26.0, 50.0, 72.0, 111.0, 208.0, 435.0, 965.0, 2222.0, 5457.0, 14068.0, 36125.0, 94437.0, 245040.0, 351909.0, 184751.0, 68870.0, 26096.0, 10447.0, 4108.0, 1647.0, 703.0, 340.0, 156.0, 106.0, 45.0, 32.0, 31.0, 16.0, 11.0, 7.0, 5.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.011810302734375, -1.94549560546875, -1.879180908203125, -1.8128662109375, -1.746551513671875, -1.68023681640625, -1.613922119140625, -1.547607421875, -1.481292724609375, -1.41497802734375, -1.348663330078125, -1.2823486328125, -1.216033935546875, -1.14971923828125, -1.083404541015625, -1.01708984375, -0.950775146484375, -0.88446044921875, -0.818145751953125, -0.7518310546875, -0.685516357421875, -0.61920166015625, -0.552886962890625, -0.486572265625, -0.420257568359375, -0.35394287109375, -0.287628173828125, -0.2213134765625, -0.154998779296875, -0.08868408203125, -0.022369384765625, 0.0439453125, 0.110260009765625, 0.17657470703125, 0.242889404296875, 0.3092041015625, 0.375518798828125, 0.44183349609375, 0.508148193359375, 0.574462890625, 0.640777587890625, 0.70709228515625, 0.773406982421875, 0.8397216796875, 0.906036376953125, 0.97235107421875, 1.038665771484375, 1.10498046875, 1.171295166015625, 1.23760986328125, 1.303924560546875, 1.3702392578125, 1.436553955078125, 1.50286865234375, 1.569183349609375, 1.635498046875, 1.701812744140625, 1.76812744140625, 1.834442138671875, 1.9007568359375, 1.967071533203125, 2.03338623046875, 2.099700927734375, 2.166015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 3.0, 10.0, 9.0, 13.0, 15.0, 11.0, 20.0, 28.0, 27.0, 40.0, 41.0, 51.0, 57.0, 41.0, 42.0, 47.0, 58.0, 45.0, 31.0, 47.0, 51.0, 43.0, 38.0, 38.0, 31.0, 27.0, 19.0, 27.0, 16.0, 14.0, 12.0, 11.0, 9.0, 3.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.575653076171875, -1.51263427734375, -1.449615478515625, -1.3865966796875, -1.323577880859375, -1.26055908203125, -1.197540283203125, -1.134521484375, -1.071502685546875, -1.00848388671875, -0.945465087890625, -0.8824462890625, -0.819427490234375, -0.75640869140625, -0.693389892578125, -0.63037109375, -0.567352294921875, -0.50433349609375, -0.441314697265625, -0.3782958984375, -0.315277099609375, -0.25225830078125, -0.189239501953125, -0.126220703125, -0.063201904296875, -0.00018310546875, 0.062835693359375, 0.1258544921875, 0.188873291015625, 0.25189208984375, 0.314910888671875, 0.3779296875, 0.440948486328125, 0.50396728515625, 0.566986083984375, 0.6300048828125, 0.693023681640625, 0.75604248046875, 0.819061279296875, 0.882080078125, 0.945098876953125, 1.00811767578125, 1.071136474609375, 1.1341552734375, 1.197174072265625, 1.26019287109375, 1.323211669921875, 1.38623046875, 1.449249267578125, 1.51226806640625, 1.575286865234375, 1.6383056640625, 1.701324462890625, 1.76434326171875, 1.827362060546875, 1.890380859375, 1.953399658203125, 2.01641845703125, 2.079437255859375, 2.1424560546875, 2.205474853515625, 2.26849365234375, 2.331512451171875, 2.39453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 5.0, 13.0, 17.0, 30.0, 45.0, 62.0, 94.0, 153.0, 258.0, 390.0, 649.0, 1012.0, 1586.0, 2657.0, 4647.0, 8280.0, 15455.0, 29270.0, 55455.0, 104676.0, 180962.0, 229682.0, 184216.0, 106924.0, 56423.0, 29487.0, 15479.0, 8694.0, 4740.0, 2768.0, 1662.0, 951.0, 637.0, 417.0, 271.0, 159.0, 99.0, 78.0, 54.0, 38.0, 23.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.677734375, -0.656890869140625, -0.63604736328125, -0.615203857421875, -0.5943603515625, -0.573516845703125, -0.55267333984375, -0.531829833984375, -0.510986328125, -0.490142822265625, -0.46929931640625, -0.448455810546875, -0.4276123046875, -0.406768798828125, -0.38592529296875, -0.365081787109375, -0.34423828125, -0.323394775390625, -0.30255126953125, -0.281707763671875, -0.2608642578125, -0.240020751953125, -0.21917724609375, -0.198333740234375, -0.177490234375, -0.156646728515625, -0.13580322265625, -0.114959716796875, -0.0941162109375, -0.073272705078125, -0.05242919921875, -0.031585693359375, -0.0107421875, 0.010101318359375, 0.03094482421875, 0.051788330078125, 0.0726318359375, 0.093475341796875, 0.11431884765625, 0.135162353515625, 0.156005859375, 0.176849365234375, 0.19769287109375, 0.218536376953125, 0.2393798828125, 0.260223388671875, 0.28106689453125, 0.301910400390625, 0.32275390625, 0.343597412109375, 0.36444091796875, 0.385284423828125, 0.4061279296875, 0.426971435546875, 0.44781494140625, 0.468658447265625, 0.489501953125, 0.510345458984375, 0.53118896484375, 0.552032470703125, 0.5728759765625, 0.593719482421875, 0.61456298828125, 0.635406494140625, 0.65625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 8.0, 8.0, 4.0, 7.0, 9.0, 20.0, 12.0, 22.0, 18.0, 28.0, 35.0, 40.0, 54.0, 61.0, 57.0, 97.0, 91.0, 71.0, 69.0, 63.0, 49.0, 34.0, 28.0, 20.0, 13.0, 12.0, 11.0, 10.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001990795135498047, -0.00019340217113494873, -0.00018772482872009277, -0.00018204748630523682, -0.00017637014389038086, -0.0001706928014755249, -0.00016501545906066895, -0.000159338116645813, -0.00015366077423095703, -0.00014798343181610107, -0.00014230608940124512, -0.00013662874698638916, -0.0001309514045715332, -0.00012527406215667725, -0.00011959671974182129, -0.00011391937732696533, -0.00010824203491210938, -0.00010256469249725342, -9.688735008239746e-05, -9.12100076675415e-05, -8.553266525268555e-05, -7.985532283782959e-05, -7.417798042297363e-05, -6.850063800811768e-05, -6.282329559326172e-05, -5.714595317840576e-05, -5.1468610763549805e-05, -4.579126834869385e-05, -4.011392593383789e-05, -3.4436583518981934e-05, -2.8759241104125977e-05, -2.308189868927002e-05, -1.7404556274414062e-05, -1.1727213859558105e-05, -6.0498714447021484e-06, -3.725290298461914e-07, 5.304813385009766e-06, 1.0982155799865723e-05, 1.665949821472168e-05, 2.2336840629577637e-05, 2.8014183044433594e-05, 3.369152545928955e-05, 3.936886787414551e-05, 4.5046210289001465e-05, 5.072355270385742e-05, 5.640089511871338e-05, 6.207823753356934e-05, 6.775557994842529e-05, 7.343292236328125e-05, 7.911026477813721e-05, 8.478760719299316e-05, 9.046494960784912e-05, 9.614229202270508e-05, 0.00010181963443756104, 0.00010749697685241699, 0.00011317431926727295, 0.0001188516616821289, 0.00012452900409698486, 0.00013020634651184082, 0.00013588368892669678, 0.00014156103134155273, 0.0001472383737564087, 0.00015291571617126465, 0.0001585930585861206, 0.00016427040100097656]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 12.0, 10.0, 16.0, 24.0, 36.0, 54.0, 76.0, 148.0, 247.0, 411.0, 685.0, 1287.0, 2263.0, 4327.0, 8347.0, 16775.0, 35347.0, 77042.0, 160526.0, 262753.0, 235182.0, 127876.0, 59515.0, 27758.0, 13382.0, 6636.0, 3462.0, 1843.0, 1029.0, 564.0, 343.0, 198.0, 127.0, 88.0, 60.0, 37.0, 21.0, 16.0, 6.0, 12.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.82763671875, -0.8038787841796875, -0.780120849609375, -0.7563629150390625, -0.73260498046875, -0.7088470458984375, -0.685089111328125, -0.6613311767578125, -0.6375732421875, -0.6138153076171875, -0.590057373046875, -0.5662994384765625, -0.54254150390625, -0.5187835693359375, -0.495025634765625, -0.4712677001953125, -0.447509765625, -0.4237518310546875, -0.399993896484375, -0.3762359619140625, -0.35247802734375, -0.3287200927734375, -0.304962158203125, -0.2812042236328125, -0.2574462890625, -0.2336883544921875, -0.209930419921875, -0.1861724853515625, -0.16241455078125, -0.1386566162109375, -0.114898681640625, -0.0911407470703125, -0.0673828125, -0.0436248779296875, -0.019866943359375, 0.0038909912109375, 0.02764892578125, 0.0514068603515625, 0.075164794921875, 0.0989227294921875, 0.1226806640625, 0.1464385986328125, 0.170196533203125, 0.1939544677734375, 0.21771240234375, 0.2414703369140625, 0.265228271484375, 0.2889862060546875, 0.312744140625, 0.3365020751953125, 0.360260009765625, 0.3840179443359375, 0.40777587890625, 0.4315338134765625, 0.455291748046875, 0.4790496826171875, 0.5028076171875, 0.5265655517578125, 0.550323486328125, 0.5740814208984375, 0.59783935546875, 0.6215972900390625, 0.645355224609375, 0.6691131591796875, 0.69287109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 0.0, 2.0, 5.0, 6.0, 9.0, 14.0, 14.0, 17.0, 23.0, 26.0, 30.0, 40.0, 46.0, 74.0, 69.0, 91.0, 84.0, 75.0, 74.0, 51.0, 47.0, 46.0, 41.0, 24.0, 18.0, 20.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.8323593139648438, -0.8038787841796875, -0.7753982543945312, -0.746917724609375, -0.7184371948242188, -0.6899566650390625, -0.6614761352539062, -0.63299560546875, -0.6045150756835938, -0.5760345458984375, -0.5475540161132812, -0.519073486328125, -0.49059295654296875, -0.4621124267578125, -0.43363189697265625, -0.4051513671875, -0.37667083740234375, -0.3481903076171875, -0.31970977783203125, -0.291229248046875, -0.26274871826171875, -0.2342681884765625, -0.20578765869140625, -0.17730712890625, -0.14882659912109375, -0.1203460693359375, -0.09186553955078125, -0.063385009765625, -0.03490447998046875, -0.0064239501953125, 0.02205657958984375, 0.050537109375, 0.07901763916015625, 0.1074981689453125, 0.13597869873046875, 0.164459228515625, 0.19293975830078125, 0.2214202880859375, 0.24990081787109375, 0.27838134765625, 0.30686187744140625, 0.3353424072265625, 0.36382293701171875, 0.392303466796875, 0.42078399658203125, 0.4492645263671875, 0.47774505615234375, 0.5062255859375, 0.5347061157226562, 0.5631866455078125, 0.5916671752929688, 0.620147705078125, 0.6486282348632812, 0.6771087646484375, 0.7055892944335938, 0.73406982421875, 0.7625503540039062, 0.7910308837890625, 0.8195114135742188, 0.847991943359375, 0.8764724731445312, 0.9049530029296875, 0.9334335327148438, 0.9619140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 31.0, 31.0, 46.0, 65.0, 73.0, 93.0, 104.0, 101.0, 90.0, 83.0, 72.0, 65.0, 46.0, 39.0, 20.0, 13.0, 9.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.832776069641113, -8.563865661621094, -8.294955253601074, -8.026044845581055, -7.757134437561035, -7.488224029541016, -7.219313621520996, -6.950403213500977, -6.681492805480957, -6.4125823974609375, -6.143671989440918, -5.874761581420898, -5.605851173400879, -5.336940765380859, -5.06803035736084, -4.79911994934082, -4.530209541320801, -4.261299133300781, -3.9923887252807617, -3.723478317260742, -3.4545679092407227, -3.185657501220703, -2.9167470932006836, -2.647836685180664, -2.3789262771606445, -2.110015869140625, -1.8411054611206055, -1.572195053100586, -1.3032846450805664, -1.0343742370605469, -0.7654638290405273, -0.4965534210205078, -0.2276439666748047, 0.041266441345214844, 0.3101768493652344, 0.5790872573852539, 0.8479976654052734, 1.116908073425293, 1.3858184814453125, 1.654728889465332, 1.9236392974853516, 2.192549705505371, 2.4614601135253906, 2.73037052154541, 2.9992809295654297, 3.268191337585449, 3.5371017456054688, 3.8060121536254883, 4.074922561645508, 4.343832969665527, 4.612743377685547, 4.881653785705566, 5.150564193725586, 5.4194746017456055, 5.688385009765625, 5.9572954177856445, 6.226205825805664, 6.495116233825684, 6.764026641845703, 7.032937049865723, 7.301847457885742, 7.570757865905762, 7.839668273925781, 8.1085786819458, 8.37748908996582]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 12.0, 8.0, 11.0, 14.0, 14.0, 16.0, 16.0, 26.0, 26.0, 24.0, 23.0, 37.0, 30.0, 35.0, 39.0, 33.0, 35.0, 44.0, 25.0, 33.0, 29.0, 40.0, 31.0, 42.0, 28.0, 34.0, 31.0, 27.0, 34.0, 23.0, 25.0, 16.0, 20.0, 22.0, 20.0, 12.0, 8.0, 11.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.624483108520508, -4.483680248260498, -4.342877388000488, -4.2020745277404785, -4.061271667480469, -3.920468807220459, -3.779665946960449, -3.6388630867004395, -3.4980602264404297, -3.35725736618042, -3.21645450592041, -3.0756516456604004, -2.9348487854003906, -2.794045925140381, -2.653243064880371, -2.5124402046203613, -2.3716371059417725, -2.2308342456817627, -2.090031385421753, -1.9492285251617432, -1.8084256649017334, -1.6676228046417236, -1.5268198251724243, -1.3860169649124146, -1.2452141046524048, -1.104411244392395, -0.9636083841323853, -0.8228054642677307, -0.682002604007721, -0.5411997437477112, -0.40039682388305664, -0.2595939636230469, -0.11879110336303711, 0.02201177179813385, 0.1628146469593048, 0.30361753702163696, 0.44442039728164673, 0.5852232575416565, 0.726026177406311, 0.8668290376663208, 1.0076318979263306, 1.1484347581863403, 1.28923761844635, 1.4300405979156494, 1.5708434581756592, 1.711646318435669, 1.8524491786956787, 1.9932520389556885, 2.1340548992156982, 2.274857759475708, 2.4156606197357178, 2.5564634799957275, 2.6972663402557373, 2.838069200515747, 2.978872299194336, 3.1196751594543457, 3.2604780197143555, 3.4012808799743652, 3.542083740234375, 3.6828866004943848, 3.8236894607543945, 3.9644923210144043, 4.105295181274414, 4.246098041534424, 4.386900901794434]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 10.0, 5.0, 8.0, 17.0, 33.0, 42.0, 56.0, 65.0, 121.0, 213.0, 351.0, 590.0, 1097.0, 2165.0, 4718.0, 10741.0, 27506.0, 76861.0, 242984.0, 896205.0, 1964504.0, 675976.0, 189423.0, 61480.0, 22367.0, 9102.0, 3796.0, 1763.0, 880.0, 481.0, 289.0, 143.0, 98.0, 65.0, 38.0, 32.0, 12.0, 15.0, 9.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3056640625, -1.2697906494140625, -1.233917236328125, -1.1980438232421875, -1.16217041015625, -1.1262969970703125, -1.090423583984375, -1.0545501708984375, -1.0186767578125, -0.9828033447265625, -0.946929931640625, -0.9110565185546875, -0.87518310546875, -0.8393096923828125, -0.803436279296875, -0.7675628662109375, -0.731689453125, -0.6958160400390625, -0.659942626953125, -0.6240692138671875, -0.58819580078125, -0.5523223876953125, -0.516448974609375, -0.4805755615234375, -0.4447021484375, -0.4088287353515625, -0.372955322265625, -0.3370819091796875, -0.30120849609375, -0.2653350830078125, -0.229461669921875, -0.1935882568359375, -0.15771484375, -0.1218414306640625, -0.085968017578125, -0.0500946044921875, -0.01422119140625, 0.0216522216796875, 0.057525634765625, 0.0933990478515625, 0.1292724609375, 0.1651458740234375, 0.201019287109375, 0.2368927001953125, 0.27276611328125, 0.3086395263671875, 0.344512939453125, 0.3803863525390625, 0.416259765625, 0.4521331787109375, 0.488006591796875, 0.5238800048828125, 0.55975341796875, 0.5956268310546875, 0.631500244140625, 0.6673736572265625, 0.7032470703125, 0.7391204833984375, 0.774993896484375, 0.8108673095703125, 0.84674072265625, 0.8826141357421875, 0.918487548828125, 0.9543609619140625, 0.990234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 5.0, 20.0, 23.0, 23.0, 26.0, 22.0, 26.0, 26.0, 36.0, 34.0, 56.0, 48.0, 67.0, 44.0, 51.0, 44.0, 35.0, 46.0, 35.0, 50.0, 32.0, 36.0, 42.0, 22.0, 25.0, 18.0, 17.0, 12.0, 7.0, 8.0, 8.0, 8.0, 8.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.779296875, -0.7573776245117188, -0.7354583740234375, -0.7135391235351562, -0.691619873046875, -0.6697006225585938, -0.6477813720703125, -0.6258621215820312, -0.60394287109375, -0.5820236206054688, -0.5601043701171875, -0.5381851196289062, -0.516265869140625, -0.49434661865234375, -0.4724273681640625, -0.45050811767578125, -0.4285888671875, -0.40666961669921875, -0.3847503662109375, -0.36283111572265625, -0.340911865234375, -0.31899261474609375, -0.2970733642578125, -0.27515411376953125, -0.25323486328125, -0.23131561279296875, -0.2093963623046875, -0.18747711181640625, -0.165557861328125, -0.14363861083984375, -0.1217193603515625, -0.09980010986328125, -0.077880859375, -0.05596160888671875, -0.0340423583984375, -0.01212310791015625, 0.009796142578125, 0.03171539306640625, 0.0536346435546875, 0.07555389404296875, 0.09747314453125, 0.11939239501953125, 0.1413116455078125, 0.16323089599609375, 0.185150146484375, 0.20706939697265625, 0.2289886474609375, 0.25090789794921875, 0.2728271484375, 0.29474639892578125, 0.3166656494140625, 0.33858489990234375, 0.360504150390625, 0.38242340087890625, 0.4043426513671875, 0.42626190185546875, 0.44818115234375, 0.47010040283203125, 0.4920196533203125, 0.5139389038085938, 0.535858154296875, 0.5577774047851562, 0.5796966552734375, 0.6016159057617188, 0.62353515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 9.0, 7.0, 9.0, 12.0, 28.0, 36.0, 54.0, 91.0, 164.0, 273.0, 423.0, 817.0, 1598.0, 3523.0, 8442.0, 23320.0, 76251.0, 306394.0, 1383675.0, 1810855.0, 428071.0, 101657.0, 29933.0, 10397.0, 4131.0, 1925.0, 954.0, 518.0, 249.0, 162.0, 113.0, 52.0, 39.0, 36.0, 21.0, 13.0, 3.0, 9.0, 6.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7578125, -1.695281982421875, -1.63275146484375, -1.570220947265625, -1.5076904296875, -1.445159912109375, -1.38262939453125, -1.320098876953125, -1.257568359375, -1.195037841796875, -1.13250732421875, -1.069976806640625, -1.0074462890625, -0.944915771484375, -0.88238525390625, -0.819854736328125, -0.75732421875, -0.694793701171875, -0.63226318359375, -0.569732666015625, -0.5072021484375, -0.444671630859375, -0.38214111328125, -0.319610595703125, -0.257080078125, -0.194549560546875, -0.13201904296875, -0.069488525390625, -0.0069580078125, 0.055572509765625, 0.11810302734375, 0.180633544921875, 0.2431640625, 0.305694580078125, 0.36822509765625, 0.430755615234375, 0.4932861328125, 0.555816650390625, 0.61834716796875, 0.680877685546875, 0.743408203125, 0.805938720703125, 0.86846923828125, 0.930999755859375, 0.9935302734375, 1.056060791015625, 1.11859130859375, 1.181121826171875, 1.24365234375, 1.306182861328125, 1.36871337890625, 1.431243896484375, 1.4937744140625, 1.556304931640625, 1.61883544921875, 1.681365966796875, 1.743896484375, 1.806427001953125, 1.86895751953125, 1.931488037109375, 1.9940185546875, 2.056549072265625, 2.11907958984375, 2.181610107421875, 2.244140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 7.0, 8.0, 17.0, 19.0, 35.0, 51.0, 66.0, 84.0, 130.0, 222.0, 268.0, 377.0, 521.0, 619.0, 473.0, 346.0, 259.0, 186.0, 117.0, 89.0, 56.0, 38.0, 30.0, 19.0, 10.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5093536376953125, -1.454254150390625, -1.3991546630859375, -1.34405517578125, -1.2889556884765625, -1.233856201171875, -1.1787567138671875, -1.1236572265625, -1.0685577392578125, -1.013458251953125, -0.9583587646484375, -0.90325927734375, -0.8481597900390625, -0.793060302734375, -0.7379608154296875, -0.682861328125, -0.6277618408203125, -0.572662353515625, -0.5175628662109375, -0.46246337890625, -0.4073638916015625, -0.352264404296875, -0.2971649169921875, -0.2420654296875, -0.1869659423828125, -0.131866455078125, -0.0767669677734375, -0.02166748046875, 0.0334320068359375, 0.088531494140625, 0.1436309814453125, 0.19873046875, 0.2538299560546875, 0.308929443359375, 0.3640289306640625, 0.41912841796875, 0.4742279052734375, 0.529327392578125, 0.5844268798828125, 0.6395263671875, 0.6946258544921875, 0.749725341796875, 0.8048248291015625, 0.85992431640625, 0.9150238037109375, 0.970123291015625, 1.0252227783203125, 1.080322265625, 1.1354217529296875, 1.190521240234375, 1.2456207275390625, 1.30072021484375, 1.3558197021484375, 1.410919189453125, 1.4660186767578125, 1.5211181640625, 1.5762176513671875, 1.631317138671875, 1.6864166259765625, 1.74151611328125, 1.7966156005859375, 1.851715087890625, 1.9068145751953125, 1.9619140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 20.0, 20.0, 29.0, 58.0, 69.0, 67.0, 89.0, 91.0, 114.0, 82.0, 80.0, 71.0, 68.0, 45.0, 24.0, 21.0, 14.0, 10.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5529046058654785, -7.2928547859191895, -7.032805442810059, -6.7727556228637695, -6.512706279754639, -6.25265645980835, -5.992607116699219, -5.73255729675293, -5.472507476806641, -5.212457656860352, -4.952408313751221, -4.692358493804932, -4.432309150695801, -4.172259330749512, -3.9122097492218018, -3.652160167694092, -3.392110824584961, -3.132061243057251, -2.872011661529541, -2.611961841583252, -2.351912498474121, -2.091862678527832, -1.831813097000122, -1.571763515472412, -1.3117139339447021, -1.0516643524169922, -0.7916147112846375, -0.5315650701522827, -0.27151548862457275, -0.011465907096862793, 0.24858379364013672, 0.5086333751678467, 0.7686834335327148, 1.0287330150604248, 1.2887825965881348, 1.5488322973251343, 1.8088818788528442, 2.0689315795898438, 2.3289811611175537, 2.5890307426452637, 2.8490803241729736, 3.1091299057006836, 3.3691794872283936, 3.6292290687561035, 3.8892788887023926, 4.149328231811523, 4.4093780517578125, 4.669427871704102, 4.929477214813232, 5.1895270347595215, 5.449576377868652, 5.709626197814941, 5.969675540924072, 6.229725360870361, 6.489774703979492, 6.749824523925781, 7.00987434387207, 7.269924163818359, 7.52997350692749, 7.790023326873779, 8.05007266998291, 8.3101224899292, 8.570172309875488, 8.830221176147461, 9.09027099609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 7.0, 10.0, 13.0, 8.0, 11.0, 16.0, 21.0, 30.0, 27.0, 32.0, 33.0, 40.0, 41.0, 38.0, 41.0, 44.0, 46.0, 39.0, 45.0, 50.0, 35.0, 39.0, 34.0, 42.0, 40.0, 41.0, 27.0, 17.0, 14.0, 17.0, 15.0, 16.0, 10.0, 12.0, 15.0, 4.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.416705131530762, -4.264392852783203, -4.112080097198486, -3.9597678184509277, -3.807455539703369, -3.6551430225372314, -3.5028305053710938, -3.350518226623535, -3.1982057094573975, -3.0458931922912598, -2.893580913543701, -2.7412683963775635, -2.588955879211426, -2.436643600463867, -2.2843310832977295, -2.132018566131592, -1.9797062873840332, -1.827393889427185, -1.675081491470337, -1.5227689743041992, -1.370456576347351, -1.218144178390503, -1.0658316612243652, -0.9135192632675171, -0.761206865310669, -0.6088944673538208, -0.4565820097923279, -0.30426958203315735, -0.15195715427398682, 0.0003552436828613281, 0.15266770124435425, 0.30498015880584717, 0.4572920799255371, 0.6096044778823853, 0.7619169354438782, 0.9142293930053711, 1.0665417909622192, 1.2188541889190674, 1.371166706085205, 1.5234791040420532, 1.6757915019989014, 1.8281038999557495, 1.9804162979125977, 2.1327288150787354, 2.285041332244873, 2.4373536109924316, 2.5896661281585693, 2.741978645324707, 2.8942909240722656, 3.0466034412384033, 3.198915719985962, 3.3512282371520996, 3.503540515899658, 3.655853033065796, 3.8081655502319336, 3.960477828979492, 4.112790107727051, 4.265102386474609, 4.417415142059326, 4.569727420806885, 4.722039699554443, 4.87435245513916, 5.026664733886719, 5.178977012634277, 5.331289768218994]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 8.0, 9.0, 12.0, 17.0, 24.0, 44.0, 70.0, 96.0, 192.0, 295.0, 494.0, 863.0, 1634.0, 2805.0, 5081.0, 9053.0, 16830.0, 30664.0, 58479.0, 122490.0, 240919.0, 264025.0, 146385.0, 69357.0, 35628.0, 19145.0, 10531.0, 5650.0, 3376.0, 1944.0, 995.0, 600.0, 334.0, 191.0, 126.0, 78.0, 34.0, 25.0, 19.0, 8.0, 8.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5419921875, -1.499298095703125, -1.45660400390625, -1.413909912109375, -1.3712158203125, -1.328521728515625, -1.28582763671875, -1.243133544921875, -1.200439453125, -1.157745361328125, -1.11505126953125, -1.072357177734375, -1.0296630859375, -0.986968994140625, -0.94427490234375, -0.901580810546875, -0.85888671875, -0.816192626953125, -0.77349853515625, -0.730804443359375, -0.6881103515625, -0.645416259765625, -0.60272216796875, -0.560028076171875, -0.517333984375, -0.474639892578125, -0.43194580078125, -0.389251708984375, -0.3465576171875, -0.303863525390625, -0.26116943359375, -0.218475341796875, -0.17578125, -0.133087158203125, -0.09039306640625, -0.047698974609375, -0.0050048828125, 0.037689208984375, 0.08038330078125, 0.123077392578125, 0.165771484375, 0.208465576171875, 0.25115966796875, 0.293853759765625, 0.3365478515625, 0.379241943359375, 0.42193603515625, 0.464630126953125, 0.50732421875, 0.550018310546875, 0.59271240234375, 0.635406494140625, 0.6781005859375, 0.720794677734375, 0.76348876953125, 0.806182861328125, 0.848876953125, 0.891571044921875, 0.93426513671875, 0.976959228515625, 1.0196533203125, 1.062347412109375, 1.10504150390625, 1.147735595703125, 1.1904296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 10.0, 6.0, 12.0, 13.0, 18.0, 19.0, 23.0, 23.0, 23.0, 29.0, 30.0, 37.0, 39.0, 31.0, 37.0, 38.0, 52.0, 36.0, 44.0, 29.0, 38.0, 40.0, 42.0, 51.0, 29.0, 19.0, 24.0, 21.0, 23.0, 25.0, 18.0, 14.0, 15.0, 14.0, 10.0, 7.0, 12.0, 4.0, 5.0, 7.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.6455078125, -0.6254806518554688, -0.6054534912109375, -0.5854263305664062, -0.565399169921875, -0.5453720092773438, -0.5253448486328125, -0.5053176879882812, -0.48529052734375, -0.46526336669921875, -0.4452362060546875, -0.42520904541015625, -0.405181884765625, -0.38515472412109375, -0.3651275634765625, -0.34510040283203125, -0.3250732421875, -0.30504608154296875, -0.2850189208984375, -0.26499176025390625, -0.244964599609375, -0.22493743896484375, -0.2049102783203125, -0.18488311767578125, -0.16485595703125, -0.14482879638671875, -0.1248016357421875, -0.10477447509765625, -0.084747314453125, -0.06472015380859375, -0.0446929931640625, -0.02466583251953125, -0.004638671875, 0.01538848876953125, 0.0354156494140625, 0.05544281005859375, 0.075469970703125, 0.09549713134765625, 0.1155242919921875, 0.13555145263671875, 0.15557861328125, 0.17560577392578125, 0.1956329345703125, 0.21566009521484375, 0.235687255859375, 0.25571441650390625, 0.2757415771484375, 0.29576873779296875, 0.3157958984375, 0.33582305908203125, 0.3558502197265625, 0.37587738037109375, 0.395904541015625, 0.41593170166015625, 0.4359588623046875, 0.45598602294921875, 0.47601318359375, 0.49604034423828125, 0.5160675048828125, 0.5360946655273438, 0.556121826171875, 0.5761489868164062, 0.5961761474609375, 0.6162033081054688, 0.63623046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 12.0, 7.0, 5.0, 7.0, 16.0, 21.0, 23.0, 29.0, 70.0, 84.0, 146.0, 227.0, 415.0, 750.0, 1350.0, 2531.0, 5091.0, 10971.0, 25082.0, 60259.0, 176589.0, 415399.0, 221698.0, 73074.0, 29547.0, 12840.0, 5958.0, 2906.0, 1460.0, 810.0, 490.0, 234.0, 157.0, 75.0, 53.0, 48.0, 23.0, 19.0, 20.0, 11.0, 9.0, 7.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9541015625, -1.8880767822265625, -1.822052001953125, -1.7560272216796875, -1.69000244140625, -1.6239776611328125, -1.557952880859375, -1.4919281005859375, -1.4259033203125, -1.3598785400390625, -1.293853759765625, -1.2278289794921875, -1.16180419921875, -1.0957794189453125, -1.029754638671875, -0.9637298583984375, -0.897705078125, -0.8316802978515625, -0.765655517578125, -0.6996307373046875, -0.63360595703125, -0.5675811767578125, -0.501556396484375, -0.4355316162109375, -0.3695068359375, -0.3034820556640625, -0.237457275390625, -0.1714324951171875, -0.10540771484375, -0.0393829345703125, 0.026641845703125, 0.0926666259765625, 0.15869140625, 0.2247161865234375, 0.290740966796875, 0.3567657470703125, 0.42279052734375, 0.4888153076171875, 0.554840087890625, 0.6208648681640625, 0.6868896484375, 0.7529144287109375, 0.818939208984375, 0.8849639892578125, 0.95098876953125, 1.0170135498046875, 1.083038330078125, 1.1490631103515625, 1.215087890625, 1.2811126708984375, 1.347137451171875, 1.4131622314453125, 1.47918701171875, 1.5452117919921875, 1.611236572265625, 1.6772613525390625, 1.7432861328125, 1.8093109130859375, 1.875335693359375, 1.9413604736328125, 2.00738525390625, 2.0734100341796875, 2.139434814453125, 2.2054595947265625, 2.271484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 9.0, 12.0, 8.0, 11.0, 10.0, 21.0, 12.0, 21.0, 20.0, 22.0, 30.0, 37.0, 28.0, 40.0, 43.0, 60.0, 47.0, 43.0, 35.0, 60.0, 37.0, 43.0, 48.0, 37.0, 31.0, 37.0, 28.0, 23.0, 25.0, 11.0, 12.0, 13.0, 18.0, 5.0, 10.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90234375, -1.835845947265625, -1.76934814453125, -1.702850341796875, -1.6363525390625, -1.569854736328125, -1.50335693359375, -1.436859130859375, -1.370361328125, -1.303863525390625, -1.23736572265625, -1.170867919921875, -1.1043701171875, -1.037872314453125, -0.97137451171875, -0.904876708984375, -0.83837890625, -0.771881103515625, -0.70538330078125, -0.638885498046875, -0.5723876953125, -0.505889892578125, -0.43939208984375, -0.372894287109375, -0.306396484375, -0.239898681640625, -0.17340087890625, -0.106903076171875, -0.0404052734375, 0.026092529296875, 0.09259033203125, 0.159088134765625, 0.2255859375, 0.292083740234375, 0.35858154296875, 0.425079345703125, 0.4915771484375, 0.558074951171875, 0.62457275390625, 0.691070556640625, 0.757568359375, 0.824066162109375, 0.89056396484375, 0.957061767578125, 1.0235595703125, 1.090057373046875, 1.15655517578125, 1.223052978515625, 1.28955078125, 1.356048583984375, 1.42254638671875, 1.489044189453125, 1.5555419921875, 1.622039794921875, 1.68853759765625, 1.755035400390625, 1.821533203125, 1.888031005859375, 1.95452880859375, 2.021026611328125, 2.0875244140625, 2.154022216796875, 2.22052001953125, 2.287017822265625, 2.353515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 15.0, 27.0, 17.0, 36.0, 41.0, 60.0, 88.0, 126.0, 198.0, 282.0, 396.0, 648.0, 930.0, 1341.0, 2256.0, 3525.0, 5546.0, 9251.0, 15338.0, 26170.0, 46559.0, 93054.0, 200505.0, 282363.0, 176256.0, 81606.0, 41472.0, 23672.0, 14067.0, 8349.0, 5222.0, 3169.0, 2089.0, 1313.0, 829.0, 560.0, 393.0, 250.0, 152.0, 105.0, 91.0, 70.0, 28.0, 20.0, 15.0, 21.0, 16.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7003097534179688, -0.6764984130859375, -0.6526870727539062, -0.628875732421875, -0.6050643920898438, -0.5812530517578125, -0.5574417114257812, -0.53363037109375, -0.5098190307617188, -0.4860076904296875, -0.46219635009765625, -0.438385009765625, -0.41457366943359375, -0.3907623291015625, -0.36695098876953125, -0.3431396484375, -0.31932830810546875, -0.2955169677734375, -0.27170562744140625, -0.247894287109375, -0.22408294677734375, -0.2002716064453125, -0.17646026611328125, -0.15264892578125, -0.12883758544921875, -0.1050262451171875, -0.08121490478515625, -0.057403564453125, -0.03359222412109375, -0.0097808837890625, 0.01403045654296875, 0.037841796875, 0.06165313720703125, 0.0854644775390625, 0.10927581787109375, 0.133087158203125, 0.15689849853515625, 0.1807098388671875, 0.20452117919921875, 0.22833251953125, 0.25214385986328125, 0.2759552001953125, 0.29976654052734375, 0.323577880859375, 0.34738922119140625, 0.3712005615234375, 0.39501190185546875, 0.4188232421875, 0.44263458251953125, 0.4664459228515625, 0.49025726318359375, 0.514068603515625, 0.5378799438476562, 0.5616912841796875, 0.5855026245117188, 0.60931396484375, 0.6331253051757812, 0.6569366455078125, 0.6807479858398438, 0.704559326171875, 0.7283706665039062, 0.7521820068359375, 0.7759933471679688, 0.7998046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 6.0, 8.0, 4.0, 14.0, 13.0, 13.0, 17.0, 27.0, 39.0, 70.0, 68.0, 94.0, 120.0, 111.0, 94.0, 52.0, 44.0, 35.0, 27.0, 20.0, 18.0, 7.0, 15.0, 11.0, 7.0, 14.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002014636993408203, -0.00019466131925582886, -0.0001878589391708374, -0.00018105655908584595, -0.0001742541790008545, -0.00016745179891586304, -0.00016064941883087158, -0.00015384703874588013, -0.00014704465866088867, -0.00014024227857589722, -0.00013343989849090576, -0.0001266375184059143, -0.00011983513832092285, -0.0001130327582359314, -0.00010623037815093994, -9.942799806594849e-05, -9.262561798095703e-05, -8.582323789596558e-05, -7.902085781097412e-05, -7.221847772598267e-05, -6.541609764099121e-05, -5.8613717555999756e-05, -5.18113374710083e-05, -4.5008957386016846e-05, -3.820657730102539e-05, -3.1404197216033936e-05, -2.460181713104248e-05, -1.7799437046051025e-05, -1.099705696105957e-05, -4.194676876068115e-06, 2.60770320892334e-06, 9.410083293914795e-06, 1.621246337890625e-05, 2.3014843463897705e-05, 2.981722354888916e-05, 3.6619603633880615e-05, 4.342198371887207e-05, 5.0224363803863525e-05, 5.702674388885498e-05, 6.382912397384644e-05, 7.063150405883789e-05, 7.743388414382935e-05, 8.42362642288208e-05, 9.103864431381226e-05, 9.784102439880371e-05, 0.00010464340448379517, 0.00011144578456878662, 0.00011824816465377808, 0.00012505054473876953, 0.00013185292482376099, 0.00013865530490875244, 0.0001454576849937439, 0.00015226006507873535, 0.0001590624451637268, 0.00016586482524871826, 0.00017266720533370972, 0.00017946958541870117, 0.00018627196550369263, 0.00019307434558868408, 0.00019987672567367554, 0.000206679105758667, 0.00021348148584365845, 0.0002202838659286499, 0.00022708624601364136, 0.0002338886260986328]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 18.0, 12.0, 30.0, 47.0, 58.0, 79.0, 138.0, 168.0, 242.0, 402.0, 599.0, 1017.0, 1649.0, 2508.0, 4279.0, 7417.0, 13081.0, 23924.0, 45748.0, 94208.0, 215745.0, 302568.0, 173180.0, 75736.0, 37878.0, 20193.0, 11288.0, 6405.0, 3770.0, 2259.0, 1411.0, 876.0, 512.0, 388.0, 217.0, 150.0, 105.0, 78.0, 57.0, 29.0, 25.0, 12.0, 15.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.837890625, -0.812774658203125, -0.78765869140625, -0.762542724609375, -0.7374267578125, -0.712310791015625, -0.68719482421875, -0.662078857421875, -0.636962890625, -0.611846923828125, -0.58673095703125, -0.561614990234375, -0.5364990234375, -0.511383056640625, -0.48626708984375, -0.461151123046875, -0.43603515625, -0.410919189453125, -0.38580322265625, -0.360687255859375, -0.3355712890625, -0.310455322265625, -0.28533935546875, -0.260223388671875, -0.235107421875, -0.209991455078125, -0.18487548828125, -0.159759521484375, -0.1346435546875, -0.109527587890625, -0.08441162109375, -0.059295654296875, -0.0341796875, -0.009063720703125, 0.01605224609375, 0.041168212890625, 0.0662841796875, 0.091400146484375, 0.11651611328125, 0.141632080078125, 0.166748046875, 0.191864013671875, 0.21697998046875, 0.242095947265625, 0.2672119140625, 0.292327880859375, 0.31744384765625, 0.342559814453125, 0.36767578125, 0.392791748046875, 0.41790771484375, 0.443023681640625, 0.4681396484375, 0.493255615234375, 0.51837158203125, 0.543487548828125, 0.568603515625, 0.593719482421875, 0.61883544921875, 0.643951416015625, 0.6690673828125, 0.694183349609375, 0.71929931640625, 0.744415283203125, 0.76953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 8.0, 9.0, 15.0, 20.0, 28.0, 30.0, 46.0, 47.0, 79.0, 85.0, 110.0, 99.0, 91.0, 67.0, 57.0, 30.0, 30.0, 26.0, 20.0, 24.0, 11.0, 13.0, 9.0, 2.0, 2.0, 3.0, 1.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9232864379882812, -0.8890533447265625, -0.8548202514648438, -0.820587158203125, -0.7863540649414062, -0.7521209716796875, -0.7178878784179688, -0.68365478515625, -0.6494216918945312, -0.6151885986328125, -0.5809555053710938, -0.546722412109375, -0.5124893188476562, -0.4782562255859375, -0.44402313232421875, -0.4097900390625, -0.37555694580078125, -0.3413238525390625, -0.30709075927734375, -0.272857666015625, -0.23862457275390625, -0.2043914794921875, -0.17015838623046875, -0.13592529296875, -0.10169219970703125, -0.0674591064453125, -0.03322601318359375, 0.001007080078125, 0.03524017333984375, 0.0694732666015625, 0.10370635986328125, 0.137939453125, 0.17217254638671875, 0.2064056396484375, 0.24063873291015625, 0.274871826171875, 0.30910491943359375, 0.3433380126953125, 0.37757110595703125, 0.41180419921875, 0.44603729248046875, 0.4802703857421875, 0.5145034790039062, 0.548736572265625, 0.5829696655273438, 0.6172027587890625, 0.6514358520507812, 0.6856689453125, 0.7199020385742188, 0.7541351318359375, 0.7883682250976562, 0.822601318359375, 0.8568344116210938, 0.8910675048828125, 0.9253005981445312, 0.95953369140625, 0.9937667846679688, 1.0279998779296875, 1.0622329711914062, 1.096466064453125, 1.1306991577148438, 1.1649322509765625, 1.1991653442382812, 1.2333984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 7.0, 7.0, 8.0, 4.0, 12.0, 18.0, 19.0, 30.0, 25.0, 29.0, 36.0, 36.0, 34.0, 33.0, 46.0, 50.0, 44.0, 50.0, 54.0, 42.0, 63.0, 53.0, 40.0, 36.0, 35.0, 21.0, 15.0, 27.0, 27.0, 10.0, 8.0, 11.0, 11.0, 7.0, 12.0, 4.0, 6.0, 5.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-5.08251953125, -4.935297966003418, -4.788075923919678, -4.6408538818359375, -4.4936323165893555, -4.346410751342773, -4.199188709259033, -4.051966667175293, -3.904745101928711, -3.75752329826355, -3.6103014945983887, -3.4630796909332275, -3.3158578872680664, -3.1686360836029053, -3.021414279937744, -2.874192476272583, -2.726970672607422, -2.5797488689422607, -2.4325270652770996, -2.2853052616119385, -2.1380834579467773, -1.9908616542816162, -1.843639850616455, -1.696418046951294, -1.5491962432861328, -1.4019744396209717, -1.2547526359558105, -1.1075308322906494, -0.9603090286254883, -0.8130872249603271, -0.665865421295166, -0.5186436176300049, -0.37142229080200195, -0.22420048713684082, -0.07697868347167969, 0.07024312019348145, 0.21746492385864258, 0.3646867275238037, 0.5119085311889648, 0.659130334854126, 0.8063521385192871, 0.9535739421844482, 1.1007957458496094, 1.2480175495147705, 1.3952393531799316, 1.5424611568450928, 1.689682960510254, 1.836904764175415, 1.9841265678405762, 2.1313483715057373, 2.2785701751708984, 2.4257919788360596, 2.5730137825012207, 2.720235586166382, 2.867457389831543, 3.014679193496704, 3.1619009971618652, 3.3091228008270264, 3.4563446044921875, 3.6035664081573486, 3.7507882118225098, 3.898010015487671, 4.045231819152832, 4.192453384399414, 4.339675426483154]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 12.0, 6.0, 10.0, 13.0, 13.0, 20.0, 24.0, 23.0, 31.0, 21.0, 43.0, 49.0, 44.0, 38.0, 55.0, 40.0, 50.0, 36.0, 46.0, 32.0, 39.0, 34.0, 30.0, 26.0, 40.0, 26.0, 29.0, 20.0, 22.0, 24.0, 14.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-5.955738067626953, -5.759530544281006, -5.5633225440979, -5.367115020751953, -5.170907020568848, -4.9746994972229, -4.778491973876953, -4.582283973693848, -4.386075973510742, -4.189868450164795, -3.9936604499816895, -3.797452926635742, -3.6012449264526367, -3.4050374031066895, -3.208829641342163, -3.0126218795776367, -2.8164143562316895, -2.620206594467163, -2.4239988327026367, -2.2277913093566895, -2.031583309173584, -1.8353756666183472, -1.6391680240631104, -1.442960262298584, -1.2467525005340576, -1.0505447387695312, -0.8543370366096497, -0.6581293344497681, -0.4619215726852417, -0.26571381092071533, -0.06950616836547852, 0.12670159339904785, 0.3229098320007324, 0.5191175937652588, 0.7153252959251404, 0.911532998085022, 1.1077407598495483, 1.3039485216140747, 1.5001561641693115, 1.696363925933838, 1.8925716876983643, 2.0887794494628906, 2.284987211227417, 2.4811949729919434, 2.6774024963378906, 2.873610496520996, 3.0698180198669434, 3.2660257816314697, 3.462233543395996, 3.6584413051605225, 3.854649066925049, 4.050856590270996, 4.247064590454102, 4.443272113800049, 4.639479637145996, 4.835687637329102, 5.031895637512207, 5.228103160858154, 5.42431116104126, 5.620518684387207, 5.8167266845703125, 6.01293420791626, 6.209141731262207, 6.4053497314453125, 6.60155725479126]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 12.0, 12.0, 18.0, 25.0, 39.0, 51.0, 78.0, 108.0, 159.0, 265.0, 394.0, 629.0, 1032.0, 1900.0, 3415.0, 6248.0, 12650.0, 25786.0, 55685.0, 129117.0, 329779.0, 1078785.0, 1739220.0, 488596.0, 178593.0, 74765.0, 33400.0, 15928.0, 7994.0, 4112.0, 2233.0, 1233.0, 777.0, 427.0, 292.0, 173.0, 101.0, 74.0, 56.0, 35.0, 27.0, 16.0, 13.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1796875, -1.144134521484375, -1.10858154296875, -1.073028564453125, -1.0374755859375, -1.001922607421875, -0.96636962890625, -0.930816650390625, -0.895263671875, -0.859710693359375, -0.82415771484375, -0.788604736328125, -0.7530517578125, -0.717498779296875, -0.68194580078125, -0.646392822265625, -0.61083984375, -0.575286865234375, -0.53973388671875, -0.504180908203125, -0.4686279296875, -0.433074951171875, -0.39752197265625, -0.361968994140625, -0.326416015625, -0.290863037109375, -0.25531005859375, -0.219757080078125, -0.1842041015625, -0.148651123046875, -0.11309814453125, -0.077545166015625, -0.0419921875, -0.006439208984375, 0.02911376953125, 0.064666748046875, 0.1002197265625, 0.135772705078125, 0.17132568359375, 0.206878662109375, 0.242431640625, 0.277984619140625, 0.31353759765625, 0.349090576171875, 0.3846435546875, 0.420196533203125, 0.45574951171875, 0.491302490234375, 0.52685546875, 0.562408447265625, 0.59796142578125, 0.633514404296875, 0.6690673828125, 0.704620361328125, 0.74017333984375, 0.775726318359375, 0.811279296875, 0.846832275390625, 0.88238525390625, 0.917938232421875, 0.9534912109375, 0.989044189453125, 1.02459716796875, 1.060150146484375, 1.095703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 8.0, 7.0, 8.0, 9.0, 12.0, 13.0, 6.0, 24.0, 20.0, 24.0, 31.0, 29.0, 33.0, 37.0, 44.0, 41.0, 36.0, 37.0, 39.0, 56.0, 43.0, 52.0, 38.0, 33.0, 37.0, 29.0, 30.0, 24.0, 21.0, 17.0, 16.0, 22.0, 18.0, 19.0, 15.0, 13.0, 7.0, 14.0, 4.0, 5.0, 7.0, 9.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.80126953125, -0.7776947021484375, -0.754119873046875, -0.7305450439453125, -0.70697021484375, -0.6833953857421875, -0.659820556640625, -0.6362457275390625, -0.6126708984375, -0.5890960693359375, -0.565521240234375, -0.5419464111328125, -0.51837158203125, -0.4947967529296875, -0.471221923828125, -0.4476470947265625, -0.424072265625, -0.4004974365234375, -0.376922607421875, -0.3533477783203125, -0.32977294921875, -0.3061981201171875, -0.282623291015625, -0.2590484619140625, -0.2354736328125, -0.2118988037109375, -0.188323974609375, -0.1647491455078125, -0.14117431640625, -0.1175994873046875, -0.094024658203125, -0.0704498291015625, -0.046875, -0.0233001708984375, 0.000274658203125, 0.0238494873046875, 0.04742431640625, 0.0709991455078125, 0.094573974609375, 0.1181488037109375, 0.1417236328125, 0.1652984619140625, 0.188873291015625, 0.2124481201171875, 0.23602294921875, 0.2595977783203125, 0.283172607421875, 0.3067474365234375, 0.330322265625, 0.3538970947265625, 0.377471923828125, 0.4010467529296875, 0.42462158203125, 0.4481964111328125, 0.471771240234375, 0.4953460693359375, 0.5189208984375, 0.5424957275390625, 0.566070556640625, 0.5896453857421875, 0.61322021484375, 0.6367950439453125, 0.660369873046875, 0.6839447021484375, 0.70751953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 5.0, 6.0, 13.0, 17.0, 18.0, 34.0, 44.0, 83.0, 114.0, 185.0, 312.0, 618.0, 1036.0, 2231.0, 5060.0, 13811.0, 44613.0, 169206.0, 811434.0, 2380145.0, 582101.0, 128509.0, 34882.0, 11413.0, 4285.0, 1950.0, 944.0, 477.0, 260.0, 147.0, 102.0, 68.0, 40.0, 31.0, 24.0, 16.0, 11.0, 3.0, 8.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.9140625, -2.824127197265625, -2.73419189453125, -2.644256591796875, -2.5543212890625, -2.464385986328125, -2.37445068359375, -2.284515380859375, -2.194580078125, -2.104644775390625, -2.01470947265625, -1.924774169921875, -1.8348388671875, -1.744903564453125, -1.65496826171875, -1.565032958984375, -1.47509765625, -1.385162353515625, -1.29522705078125, -1.205291748046875, -1.1153564453125, -1.025421142578125, -0.93548583984375, -0.845550537109375, -0.755615234375, -0.665679931640625, -0.57574462890625, -0.485809326171875, -0.3958740234375, -0.305938720703125, -0.21600341796875, -0.126068115234375, -0.0361328125, 0.053802490234375, 0.14373779296875, 0.233673095703125, 0.3236083984375, 0.413543701171875, 0.50347900390625, 0.593414306640625, 0.683349609375, 0.773284912109375, 0.86322021484375, 0.953155517578125, 1.0430908203125, 1.133026123046875, 1.22296142578125, 1.312896728515625, 1.40283203125, 1.492767333984375, 1.58270263671875, 1.672637939453125, 1.7625732421875, 1.852508544921875, 1.94244384765625, 2.032379150390625, 2.122314453125, 2.212249755859375, 2.30218505859375, 2.392120361328125, 2.4820556640625, 2.571990966796875, 2.66192626953125, 2.751861572265625, 2.841796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 10.0, 13.0, 16.0, 36.0, 49.0, 97.0, 132.0, 245.0, 385.0, 643.0, 901.0, 594.0, 337.0, 218.0, 161.0, 80.0, 57.0, 32.0, 23.0, 16.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.365875244140625, -3.28057861328125, -3.195281982421875, -3.1099853515625, -3.024688720703125, -2.93939208984375, -2.854095458984375, -2.768798828125, -2.683502197265625, -2.59820556640625, -2.512908935546875, -2.4276123046875, -2.342315673828125, -2.25701904296875, -2.171722412109375, -2.08642578125, -2.001129150390625, -1.91583251953125, -1.830535888671875, -1.7452392578125, -1.659942626953125, -1.57464599609375, -1.489349365234375, -1.404052734375, -1.318756103515625, -1.23345947265625, -1.148162841796875, -1.0628662109375, -0.977569580078125, -0.89227294921875, -0.806976318359375, -0.7216796875, -0.636383056640625, -0.55108642578125, -0.465789794921875, -0.3804931640625, -0.295196533203125, -0.20989990234375, -0.124603271484375, -0.039306640625, 0.045989990234375, 0.13128662109375, 0.216583251953125, 0.3018798828125, 0.387176513671875, 0.47247314453125, 0.557769775390625, 0.64306640625, 0.728363037109375, 0.81365966796875, 0.898956298828125, 0.9842529296875, 1.069549560546875, 1.15484619140625, 1.240142822265625, 1.325439453125, 1.410736083984375, 1.49603271484375, 1.581329345703125, 1.6666259765625, 1.751922607421875, 1.83721923828125, 1.922515869140625, 2.0078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 18.0, 34.0, 48.0, 82.0, 114.0, 129.0, 146.0, 126.0, 119.0, 76.0, 45.0, 31.0, 15.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.349769592285156, -7.915297031402588, -7.4808244705200195, -7.046351432800293, -6.611879348754883, -6.177406311035156, -5.742933750152588, -5.3084611892700195, -4.873988628387451, -4.439516067504883, -4.0050435066223145, -3.570570707321167, -3.1360981464385986, -2.7016255855560303, -2.267152786254883, -1.8326802253723145, -1.398207664489746, -0.963735044002533, -0.5292624235153198, -0.09478974342346191, 0.33968281745910645, 0.7741553783416748, 1.2086281776428223, 1.6431007385253906, 2.077573299407959, 2.5120458602905273, 2.9465184211730957, 3.380991220474243, 3.8154637813568115, 4.249936103820801, 4.684409141540527, 5.118881702423096, 5.553354263305664, 5.987826824188232, 6.422299385070801, 6.856772422790527, 7.2912445068359375, 7.725717544555664, 8.16019058227539, 8.5946626663208, 9.029134750366211, 9.463607788085938, 9.898079872131348, 10.332552909851074, 10.767024993896484, 11.201498031616211, 11.635971069335938, 12.070443153381348, 12.504916191101074, 12.9393892288208, 13.373861312866211, 13.808334350585938, 14.242806434631348, 14.677279472351074, 15.111751556396484, 15.546224594116211, 15.980697631835938, 16.415170669555664, 16.84964370727539, 17.284114837646484, 17.71858787536621, 18.153060913085938, 18.587533950805664, 19.02200698852539, 19.456478118896484]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 5.0, 3.0, 8.0, 12.0, 13.0, 22.0, 17.0, 19.0, 26.0, 19.0, 19.0, 34.0, 34.0, 40.0, 37.0, 25.0, 41.0, 35.0, 42.0, 27.0, 26.0, 42.0, 38.0, 33.0, 40.0, 38.0, 36.0, 33.0, 16.0, 30.0, 22.0, 28.0, 17.0, 18.0, 10.0, 18.0, 10.0, 9.0, 10.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.363385200500488, -5.187209129333496, -5.011033058166504, -4.834856986999512, -4.658681392669678, -4.4825053215026855, -4.306329250335693, -4.130153179168701, -3.953977108001709, -3.777801036834717, -3.6016252040863037, -3.4254491329193115, -3.2492730617523193, -3.0730972290039062, -2.896921157836914, -2.720745086669922, -2.544569253921509, -2.3683931827545166, -2.1922173500061035, -2.0160412788391113, -1.8398652076721191, -1.6636892557144165, -1.4875133037567139, -1.3113372325897217, -1.135161280632019, -0.9589852690696716, -0.7828092575073242, -0.6066333055496216, -0.43045729398727417, -0.25428128242492676, -0.07810533046722412, 0.09807074069976807, 0.2742466926574707, 0.4504227042198181, 0.6265987157821655, 0.8027746677398682, 0.9789506793022156, 1.155126690864563, 1.3313026428222656, 1.5074787139892578, 1.6836546659469604, 1.859830617904663, 2.0360066890716553, 2.2121825218200684, 2.3883585929870605, 2.5645346641540527, 2.740710735321045, 2.916886806488037, 3.09306263923645, 3.2692387104034424, 3.4454145431518555, 3.6215906143188477, 3.79776668548584, 3.973942756652832, 4.150118827819824, 4.326294898986816, 4.50247049331665, 4.678646564483643, 4.854822635650635, 5.030998229980469, 5.207174301147461, 5.383350372314453, 5.559526443481445, 5.7357025146484375, 5.91187858581543]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 2.0, 6.0, 8.0, 15.0, 20.0, 37.0, 59.0, 94.0, 116.0, 206.0, 311.0, 500.0, 721.0, 1234.0, 1834.0, 2821.0, 4301.0, 6617.0, 10311.0, 15708.0, 24291.0, 38163.0, 65009.0, 126281.0, 234239.0, 227729.0, 120356.0, 62901.0, 37511.0, 23491.0, 15132.0, 9985.0, 6582.0, 4190.0, 2789.0, 1768.0, 1148.0, 730.0, 471.0, 315.0, 195.0, 150.0, 68.0, 52.0, 34.0, 20.0, 14.0, 10.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.134033203125, -1.09619140625, -1.058349609375, -1.0205078125, -0.982666015625, -0.94482421875, -0.906982421875, -0.869140625, -0.831298828125, -0.79345703125, -0.755615234375, -0.7177734375, -0.679931640625, -0.64208984375, -0.604248046875, -0.56640625, -0.528564453125, -0.49072265625, -0.452880859375, -0.4150390625, -0.377197265625, -0.33935546875, -0.301513671875, -0.263671875, -0.225830078125, -0.18798828125, -0.150146484375, -0.1123046875, -0.074462890625, -0.03662109375, 0.001220703125, 0.0390625, 0.076904296875, 0.11474609375, 0.152587890625, 0.1904296875, 0.228271484375, 0.26611328125, 0.303955078125, 0.341796875, 0.379638671875, 0.41748046875, 0.455322265625, 0.4931640625, 0.531005859375, 0.56884765625, 0.606689453125, 0.64453125, 0.682373046875, 0.72021484375, 0.758056640625, 0.7958984375, 0.833740234375, 0.87158203125, 0.909423828125, 0.947265625, 0.985107421875, 1.02294921875, 1.060791015625, 1.0986328125, 1.136474609375, 1.17431640625, 1.212158203125, 1.25]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 10.0, 11.0, 16.0, 9.0, 20.0, 23.0, 29.0, 27.0, 38.0, 35.0, 28.0, 58.0, 50.0, 48.0, 43.0, 47.0, 51.0, 34.0, 47.0, 52.0, 43.0, 36.0, 38.0, 32.0, 31.0, 29.0, 11.0, 16.0, 12.0, 14.0, 11.0, 12.0, 10.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0517578125, -1.0201187133789062, -0.9884796142578125, -0.9568405151367188, -0.925201416015625, -0.8935623168945312, -0.8619232177734375, -0.8302841186523438, -0.79864501953125, -0.7670059204101562, -0.7353668212890625, -0.7037277221679688, -0.672088623046875, -0.6404495239257812, -0.6088104248046875, -0.5771713256835938, -0.5455322265625, -0.5138931274414062, -0.4822540283203125, -0.45061492919921875, -0.418975830078125, -0.38733673095703125, -0.3556976318359375, -0.32405853271484375, -0.29241943359375, -0.26078033447265625, -0.2291412353515625, -0.19750213623046875, -0.165863037109375, -0.13422393798828125, -0.1025848388671875, -0.07094573974609375, -0.039306640625, -0.00766754150390625, 0.0239715576171875, 0.05561065673828125, 0.087249755859375, 0.11888885498046875, 0.1505279541015625, 0.18216705322265625, 0.21380615234375, 0.24544525146484375, 0.2770843505859375, 0.30872344970703125, 0.340362548828125, 0.37200164794921875, 0.4036407470703125, 0.43527984619140625, 0.4669189453125, 0.49855804443359375, 0.5301971435546875, 0.5618362426757812, 0.593475341796875, 0.6251144409179688, 0.6567535400390625, 0.6883926391601562, 0.72003173828125, 0.7516708374023438, 0.7833099365234375, 0.8149490356445312, 0.846588134765625, 0.8782272338867188, 0.9098663330078125, 0.9415054321289062, 0.97314453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 6.0, 6.0, 13.0, 11.0, 7.0, 11.0, 22.0, 34.0, 46.0, 76.0, 115.0, 213.0, 499.0, 1183.0, 3483.0, 10612.0, 31860.0, 105588.0, 510672.0, 289170.0, 63590.0, 20399.0, 6853.0, 2375.0, 876.0, 357.0, 152.0, 100.0, 46.0, 49.0, 16.0, 22.0, 15.0, 11.0, 20.0, 8.0, 11.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.40655517578125, -3.2994384765625, -3.19232177734375, -3.085205078125, -2.97808837890625, -2.8709716796875, -2.76385498046875, -2.65673828125, -2.54962158203125, -2.4425048828125, -2.33538818359375, -2.228271484375, -2.12115478515625, -2.0140380859375, -1.90692138671875, -1.7998046875, -1.69268798828125, -1.5855712890625, -1.47845458984375, -1.371337890625, -1.26422119140625, -1.1571044921875, -1.04998779296875, -0.94287109375, -0.83575439453125, -0.7286376953125, -0.62152099609375, -0.514404296875, -0.40728759765625, -0.3001708984375, -0.19305419921875, -0.0859375, 0.02117919921875, 0.1282958984375, 0.23541259765625, 0.342529296875, 0.44964599609375, 0.5567626953125, 0.66387939453125, 0.77099609375, 0.87811279296875, 0.9852294921875, 1.09234619140625, 1.199462890625, 1.30657958984375, 1.4136962890625, 1.52081298828125, 1.6279296875, 1.73504638671875, 1.8421630859375, 1.94927978515625, 2.056396484375, 2.16351318359375, 2.2706298828125, 2.37774658203125, 2.48486328125, 2.59197998046875, 2.6990966796875, 2.80621337890625, 2.913330078125, 3.02044677734375, 3.1275634765625, 3.23468017578125, 3.341796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 2.0, 8.0, 11.0, 7.0, 16.0, 11.0, 11.0, 22.0, 14.0, 22.0, 29.0, 23.0, 35.0, 39.0, 25.0, 46.0, 37.0, 38.0, 48.0, 45.0, 45.0, 49.0, 38.0, 41.0, 40.0, 33.0, 38.0, 26.0, 32.0, 27.0, 21.0, 24.0, 26.0, 15.0, 9.0, 9.0, 13.0, 5.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.267578125, -3.17962646484375, -3.0916748046875, -3.00372314453125, -2.915771484375, -2.82781982421875, -2.7398681640625, -2.65191650390625, -2.56396484375, -2.47601318359375, -2.3880615234375, -2.30010986328125, -2.212158203125, -2.12420654296875, -2.0362548828125, -1.94830322265625, -1.8603515625, -1.77239990234375, -1.6844482421875, -1.59649658203125, -1.508544921875, -1.42059326171875, -1.3326416015625, -1.24468994140625, -1.15673828125, -1.06878662109375, -0.9808349609375, -0.89288330078125, -0.804931640625, -0.71697998046875, -0.6290283203125, -0.54107666015625, -0.453125, -0.36517333984375, -0.2772216796875, -0.18927001953125, -0.101318359375, -0.01336669921875, 0.0745849609375, 0.16253662109375, 0.25048828125, 0.33843994140625, 0.4263916015625, 0.51434326171875, 0.602294921875, 0.69024658203125, 0.7781982421875, 0.86614990234375, 0.9541015625, 1.04205322265625, 1.1300048828125, 1.21795654296875, 1.305908203125, 1.39385986328125, 1.4818115234375, 1.56976318359375, 1.65771484375, 1.74566650390625, 1.8336181640625, 1.92156982421875, 2.009521484375, 2.09747314453125, 2.1854248046875, 2.27337646484375, 2.361328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 14.0, 18.0, 18.0, 20.0, 26.0, 48.0, 64.0, 76.0, 114.0, 192.0, 302.0, 530.0, 853.0, 1431.0, 2591.0, 4442.0, 7370.0, 12482.0, 21847.0, 43741.0, 110473.0, 327728.0, 314876.0, 105882.0, 42130.0, 21433.0, 12162.0, 7279.0, 4240.0, 2466.0, 1401.0, 860.0, 524.0, 304.0, 188.0, 112.0, 91.0, 72.0, 28.0, 36.0, 24.0, 18.0, 6.0, 10.0, 8.0, 4.0, 8.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9875640869140625, -0.954620361328125, -0.9216766357421875, -0.88873291015625, -0.8557891845703125, -0.822845458984375, -0.7899017333984375, -0.7569580078125, -0.7240142822265625, -0.691070556640625, -0.6581268310546875, -0.62518310546875, -0.5922393798828125, -0.559295654296875, -0.5263519287109375, -0.493408203125, -0.4604644775390625, -0.427520751953125, -0.3945770263671875, -0.36163330078125, -0.3286895751953125, -0.295745849609375, -0.2628021240234375, -0.2298583984375, -0.1969146728515625, -0.163970947265625, -0.1310272216796875, -0.09808349609375, -0.0651397705078125, -0.032196044921875, 0.0007476806640625, 0.03369140625, 0.0666351318359375, 0.099578857421875, 0.1325225830078125, 0.16546630859375, 0.1984100341796875, 0.231353759765625, 0.2642974853515625, 0.2972412109375, 0.3301849365234375, 0.363128662109375, 0.3960723876953125, 0.42901611328125, 0.4619598388671875, 0.494903564453125, 0.5278472900390625, 0.560791015625, 0.5937347412109375, 0.626678466796875, 0.6596221923828125, 0.69256591796875, 0.7255096435546875, 0.758453369140625, 0.7913970947265625, 0.8243408203125, 0.8572845458984375, 0.890228271484375, 0.9231719970703125, 0.95611572265625, 0.9890594482421875, 1.022003173828125, 1.0549468994140625, 1.087890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 8.0, 3.0, 5.0, 7.0, 12.0, 18.0, 21.0, 22.0, 37.0, 64.0, 93.0, 143.0, 162.0, 119.0, 81.0, 59.0, 36.0, 25.0, 17.0, 11.0, 10.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002486705780029297, -0.00023988261818885803, -0.00023109465837478638, -0.00022230669856071472, -0.00021351873874664307, -0.0002047307789325714, -0.00019594281911849976, -0.0001871548593044281, -0.00017836689949035645, -0.0001695789396762848, -0.00016079097986221313, -0.00015200302004814148, -0.00014321506023406982, -0.00013442710041999817, -0.00012563914060592651, -0.00011685118079185486, -0.0001080632209777832, -9.927526116371155e-05, -9.048730134963989e-05, -8.169934153556824e-05, -7.291138172149658e-05, -6.412342190742493e-05, -5.533546209335327e-05, -4.6547502279281616e-05, -3.775954246520996e-05, -2.8971582651138306e-05, -2.018362283706665e-05, -1.1395663022994995e-05, -2.60770320892334e-06, 6.1802566051483154e-06, 1.496821641921997e-05, 2.3756176233291626e-05, 3.254413604736328e-05, 4.1332095861434937e-05, 5.012005567550659e-05, 5.890801548957825e-05, 6.76959753036499e-05, 7.648393511772156e-05, 8.527189493179321e-05, 9.405985474586487e-05, 0.00010284781455993652, 0.00011163577437400818, 0.00012042373418807983, 0.0001292116940021515, 0.00013799965381622314, 0.0001467876136302948, 0.00015557557344436646, 0.0001643635332584381, 0.00017315149307250977, 0.00018193945288658142, 0.00019072741270065308, 0.00019951537251472473, 0.0002083033323287964, 0.00021709129214286804, 0.0002258792519569397, 0.00023466721177101135, 0.000243455171585083, 0.00025224313139915466, 0.0002610310912132263, 0.000269819051027298, 0.00027860701084136963, 0.0002873949706554413, 0.00029618293046951294, 0.0003049708902835846, 0.00031375885009765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 8.0, 12.0, 22.0, 26.0, 48.0, 68.0, 86.0, 157.0, 285.0, 510.0, 845.0, 1571.0, 2789.0, 4983.0, 9048.0, 16583.0, 32186.0, 72889.0, 204888.0, 402428.0, 172394.0, 63951.0, 29087.0, 15063.0, 8231.0, 4460.0, 2517.0, 1480.0, 806.0, 450.0, 252.0, 154.0, 97.0, 56.0, 34.0, 29.0, 20.0, 15.0, 6.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9482421875, -0.916015625, -0.8837890625, -0.8515625, -0.8193359375, -0.787109375, -0.7548828125, -0.72265625, -0.6904296875, -0.658203125, -0.6259765625, -0.59375, -0.5615234375, -0.529296875, -0.4970703125, -0.46484375, -0.4326171875, -0.400390625, -0.3681640625, -0.3359375, -0.3037109375, -0.271484375, -0.2392578125, -0.20703125, -0.1748046875, -0.142578125, -0.1103515625, -0.078125, -0.0458984375, -0.013671875, 0.0185546875, 0.05078125, 0.0830078125, 0.115234375, 0.1474609375, 0.1796875, 0.2119140625, 0.244140625, 0.2763671875, 0.30859375, 0.3408203125, 0.373046875, 0.4052734375, 0.4375, 0.4697265625, 0.501953125, 0.5341796875, 0.56640625, 0.5986328125, 0.630859375, 0.6630859375, 0.6953125, 0.7275390625, 0.759765625, 0.7919921875, 0.82421875, 0.8564453125, 0.888671875, 0.9208984375, 0.953125, 0.9853515625, 1.017578125, 1.0498046875, 1.08203125, 1.1142578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 6.0, 7.0, 13.0, 12.0, 21.0, 28.0, 42.0, 47.0, 96.0, 115.0, 150.0, 129.0, 93.0, 59.0, 46.0, 38.0, 15.0, 17.0, 10.0, 8.0, 7.0, 2.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.7288665771484375, -1.680389404296875, -1.6319122314453125, -1.58343505859375, -1.5349578857421875, -1.486480712890625, -1.4380035400390625, -1.3895263671875, -1.3410491943359375, -1.292572021484375, -1.2440948486328125, -1.19561767578125, -1.1471405029296875, -1.098663330078125, -1.0501861572265625, -1.001708984375, -0.9532318115234375, -0.904754638671875, -0.8562774658203125, -0.80780029296875, -0.7593231201171875, -0.710845947265625, -0.6623687744140625, -0.6138916015625, -0.5654144287109375, -0.516937255859375, -0.4684600830078125, -0.41998291015625, -0.3715057373046875, -0.323028564453125, -0.2745513916015625, -0.22607421875, -0.1775970458984375, -0.129119873046875, -0.0806427001953125, -0.03216552734375, 0.0163116455078125, 0.064788818359375, 0.1132659912109375, 0.1617431640625, 0.2102203369140625, 0.258697509765625, 0.3071746826171875, 0.35565185546875, 0.4041290283203125, 0.452606201171875, 0.5010833740234375, 0.549560546875, 0.5980377197265625, 0.646514892578125, 0.6949920654296875, 0.74346923828125, 0.7919464111328125, 0.840423583984375, 0.8889007568359375, 0.9373779296875, 0.9858551025390625, 1.034332275390625, 1.0828094482421875, 1.13128662109375, 1.1797637939453125, 1.228240966796875, 1.2767181396484375, 1.3251953125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 35.0, 292.0, 561.0, 122.0, 6.0, 2.0], "bins": [-136.30062866210938, -134.04249572753906, -131.78436279296875, -129.5262451171875, -127.26811218261719, -125.00997924804688, -122.7518539428711, -120.49372863769531, -118.235595703125, -115.97746276855469, -113.7193374633789, -111.46121215820312, -109.20307922363281, -106.9449462890625, -104.68682098388672, -102.42869567871094, -100.17056274414062, -97.91242980957031, -95.65430450439453, -93.39617919921875, -91.13804626464844, -88.87991333007812, -86.62178802490234, -84.36366271972656, -82.10552978515625, -79.84739685058594, -77.58927154541016, -75.33114624023438, -73.07301330566406, -70.81488037109375, -68.55675506591797, -66.29862976074219, -64.04049682617188, -61.78236770629883, -59.52423858642578, -57.266109466552734, -55.00798034667969, -52.74985122680664, -50.491722106933594, -48.23359298706055, -45.975467681884766, -43.71733856201172, -41.45920944213867, -39.201080322265625, -36.94295120239258, -34.68482208251953, -32.426692962646484, -30.168563842773438, -27.91043472290039, -25.652305603027344, -23.394176483154297, -21.13604736328125, -18.877918243408203, -16.619789123535156, -14.36166000366211, -12.103530883789062, -9.845401763916016, -7.587272644042969, -5.329143524169922, -3.071014404296875, -0.8128852844238281, 1.4452438354492188, 3.7033729553222656, 5.9615020751953125, 8.21963119506836]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 6.0, 6.0, 4.0, 3.0, 10.0, 11.0, 7.0, 13.0, 15.0, 13.0, 23.0, 19.0, 34.0, 38.0, 34.0, 41.0, 43.0, 35.0, 57.0, 45.0, 50.0, 47.0, 41.0, 40.0, 40.0, 42.0, 44.0, 25.0, 32.0, 30.0, 33.0, 24.0, 12.0, 19.0, 11.0, 13.0, 7.0, 4.0, 6.0, 3.0, 10.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796760559082031, -8.49354362487793, -8.190325736999512, -7.88710880279541, -7.58389139175415, -7.280673980712891, -6.977457046508789, -6.674239635467529, -6.3710222244262695, -6.06780481338501, -5.76458740234375, -5.461370468139648, -5.158153057098389, -4.854935646057129, -4.551718711853027, -4.248501300811768, -3.945283889770508, -3.642066478729248, -3.3388493061065674, -3.0356321334838867, -2.732414722442627, -2.429197311401367, -2.1259801387786865, -1.8227629661560059, -1.519545555114746, -1.2163282632827759, -0.9131109714508057, -0.6098936796188354, -0.30667638778686523, -0.0034590959548950195, 0.2997581958770752, 0.6029753684997559, 0.9061927795410156, 1.2094100713729858, 1.512627363204956, 1.8158446550369263, 2.1190619468688965, 2.4222793579101562, 2.725496530532837, 3.0287137031555176, 3.3319311141967773, 3.635148525238037, 3.9383656978607178, 4.241582870483398, 4.544800281524658, 4.848017692565918, 5.1512346267700195, 5.454452037811279, 5.757669448852539, 6.060886859893799, 6.364104270935059, 6.66732120513916, 6.97053861618042, 7.27375602722168, 7.576972961425781, 7.880190372467041, 8.1834077835083, 8.486624717712402, 8.78984260559082, 9.093059539794922, 9.396276473999023, 9.699494361877441, 10.002711296081543, 10.305929183959961, 10.609146118164062]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 16.0, 9.0, 22.0, 16.0, 25.0, 35.0, 44.0, 58.0, 95.0, 142.0, 208.0, 341.0, 487.0, 846.0, 1272.0, 2099.0, 3503.0, 6153.0, 10807.0, 20095.0, 37815.0, 74923.0, 158507.0, 377364.0, 1364563.0, 1430068.0, 380894.0, 161200.0, 76448.0, 38372.0, 20544.0, 11361.0, 6391.0, 3680.0, 2206.0, 1323.0, 808.0, 508.0, 294.0, 205.0, 158.0, 113.0, 81.0, 62.0, 30.0, 23.0, 22.0, 16.0, 12.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.2119140625, -1.1740570068359375, -1.136199951171875, -1.0983428955078125, -1.06048583984375, -1.0226287841796875, -0.984771728515625, -0.9469146728515625, -0.9090576171875, -0.8712005615234375, -0.833343505859375, -0.7954864501953125, -0.75762939453125, -0.7197723388671875, -0.681915283203125, -0.6440582275390625, -0.606201171875, -0.5683441162109375, -0.530487060546875, -0.4926300048828125, -0.45477294921875, -0.4169158935546875, -0.379058837890625, -0.3412017822265625, -0.3033447265625, -0.2654876708984375, -0.227630615234375, -0.1897735595703125, -0.15191650390625, -0.1140594482421875, -0.076202392578125, -0.0383453369140625, -0.00048828125, 0.0373687744140625, 0.075225830078125, 0.1130828857421875, 0.15093994140625, 0.1887969970703125, 0.226654052734375, 0.2645111083984375, 0.3023681640625, 0.3402252197265625, 0.378082275390625, 0.4159393310546875, 0.45379638671875, 0.4916534423828125, 0.529510498046875, 0.5673675537109375, 0.605224609375, 0.6430816650390625, 0.680938720703125, 0.7187957763671875, 0.75665283203125, 0.7945098876953125, 0.832366943359375, 0.8702239990234375, 0.9080810546875, 0.9459381103515625, 0.983795166015625, 1.0216522216796875, 1.05950927734375, 1.0973663330078125, 1.135223388671875, 1.1730804443359375, 1.2109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 9.0, 1.0, 3.0, 14.0, 14.0, 6.0, 15.0, 14.0, 17.0, 25.0, 26.0, 26.0, 27.0, 34.0, 37.0, 55.0, 53.0, 52.0, 37.0, 45.0, 35.0, 43.0, 50.0, 33.0, 31.0, 34.0, 29.0, 32.0, 31.0, 23.0, 25.0, 18.0, 13.0, 18.0, 11.0, 10.0, 6.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.98486328125, -0.9564208984375, -0.927978515625, -0.8995361328125, -0.87109375, -0.8426513671875, -0.814208984375, -0.7857666015625, -0.75732421875, -0.7288818359375, -0.700439453125, -0.6719970703125, -0.6435546875, -0.6151123046875, -0.586669921875, -0.5582275390625, -0.52978515625, -0.5013427734375, -0.472900390625, -0.4444580078125, -0.416015625, -0.3875732421875, -0.359130859375, -0.3306884765625, -0.30224609375, -0.2738037109375, -0.245361328125, -0.2169189453125, -0.1884765625, -0.1600341796875, -0.131591796875, -0.1031494140625, -0.07470703125, -0.0462646484375, -0.017822265625, 0.0106201171875, 0.0390625, 0.0675048828125, 0.095947265625, 0.1243896484375, 0.15283203125, 0.1812744140625, 0.209716796875, 0.2381591796875, 0.2666015625, 0.2950439453125, 0.323486328125, 0.3519287109375, 0.38037109375, 0.4088134765625, 0.437255859375, 0.4656982421875, 0.494140625, 0.5225830078125, 0.551025390625, 0.5794677734375, 0.60791015625, 0.6363525390625, 0.664794921875, 0.6932373046875, 0.7216796875, 0.7501220703125, 0.778564453125, 0.8070068359375, 0.83544921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 5.0, 6.0, 8.0, 9.0, 11.0, 8.0, 20.0, 20.0, 27.0, 38.0, 50.0, 79.0, 120.0, 259.0, 618.0, 1524.0, 5149.0, 26828.0, 229210.0, 3078198.0, 770826.0, 66470.0, 10455.0, 2567.0, 935.0, 337.0, 163.0, 96.0, 50.0, 45.0, 22.0, 20.0, 11.0, 18.0, 21.0, 6.0, 9.0, 9.0, 7.0, 4.0, 5.0, 0.0, 1.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9140625, -5.7276611328125, -5.541259765625, -5.3548583984375, -5.16845703125, -4.9820556640625, -4.795654296875, -4.6092529296875, -4.4228515625, -4.2364501953125, -4.050048828125, -3.8636474609375, -3.67724609375, -3.4908447265625, -3.304443359375, -3.1180419921875, -2.931640625, -2.7452392578125, -2.558837890625, -2.3724365234375, -2.18603515625, -1.9996337890625, -1.813232421875, -1.6268310546875, -1.4404296875, -1.2540283203125, -1.067626953125, -0.8812255859375, -0.69482421875, -0.5084228515625, -0.322021484375, -0.1356201171875, 0.05078125, 0.2371826171875, 0.423583984375, 0.6099853515625, 0.79638671875, 0.9827880859375, 1.169189453125, 1.3555908203125, 1.5419921875, 1.7283935546875, 1.914794921875, 2.1011962890625, 2.28759765625, 2.4739990234375, 2.660400390625, 2.8468017578125, 3.033203125, 3.2196044921875, 3.406005859375, 3.5924072265625, 3.77880859375, 3.9652099609375, 4.151611328125, 4.3380126953125, 4.5244140625, 4.7108154296875, 4.897216796875, 5.0836181640625, 5.27001953125, 5.4564208984375, 5.642822265625, 5.8292236328125, 6.015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 10.0, 33.0, 68.0, 112.0, 236.0, 489.0, 1284.0, 912.0, 452.0, 226.0, 130.0, 55.0, 32.0, 22.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.91796875, -6.7763671875, -6.634765625, -6.4931640625, -6.3515625, -6.2099609375, -6.068359375, -5.9267578125, -5.78515625, -5.6435546875, -5.501953125, -5.3603515625, -5.21875, -5.0771484375, -4.935546875, -4.7939453125, -4.65234375, -4.5107421875, -4.369140625, -4.2275390625, -4.0859375, -3.9443359375, -3.802734375, -3.6611328125, -3.51953125, -3.3779296875, -3.236328125, -3.0947265625, -2.953125, -2.8115234375, -2.669921875, -2.5283203125, -2.38671875, -2.2451171875, -2.103515625, -1.9619140625, -1.8203125, -1.6787109375, -1.537109375, -1.3955078125, -1.25390625, -1.1123046875, -0.970703125, -0.8291015625, -0.6875, -0.5458984375, -0.404296875, -0.2626953125, -0.12109375, 0.0205078125, 0.162109375, 0.3037109375, 0.4453125, 0.5869140625, 0.728515625, 0.8701171875, 1.01171875, 1.1533203125, 1.294921875, 1.4365234375, 1.578125, 1.7197265625, 1.861328125, 2.0029296875, 2.14453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 0.0, 8.0, 13.0, 16.0, 30.0, 43.0, 55.0, 88.0, 95.0, 114.0, 118.0, 89.0, 87.0, 63.0, 62.0, 40.0, 27.0, 17.0, 21.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.139472961425781, -5.714046001434326, -5.288619518280029, -4.863192558288574, -4.437766075134277, -4.012339115142822, -3.5869123935699463, -3.1614856719970703, -2.7360589504241943, -2.3106322288513184, -1.8852055072784424, -1.4597786664962769, -1.0343519449234009, -0.6089251041412354, -0.18349838256835938, 0.2419283390045166, 0.6673550605773926, 1.0927817821502686, 1.5182085037231445, 1.94363534450531, 2.3690619468688965, 2.7944889068603516, 3.2199156284332275, 3.6453423500061035, 4.070769309997559, 4.496196269989014, 4.9216227531433105, 5.347049713134766, 5.7724761962890625, 6.197903156280518, 6.623330116271973, 7.0487565994262695, 7.474183082580566, 7.8996100425720215, 8.325037002563477, 8.750463485717773, 9.17588996887207, 9.601316452026367, 10.02674388885498, 10.452170372009277, 10.877596855163574, 11.303023338317871, 11.728450775146484, 12.153877258300781, 12.579303741455078, 13.004730224609375, 13.430157661437988, 13.855584144592285, 14.281011581420898, 14.706438064575195, 15.131865501403809, 15.557291984558105, 15.982718467712402, 16.408145904541016, 16.833572387695312, 17.25899887084961, 17.684425354003906, 18.109851837158203, 18.5352783203125, 18.960704803466797, 19.386133193969727, 19.811559677124023, 20.23698616027832, 20.662412643432617, 21.087839126586914]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 8.0, 15.0, 18.0, 13.0, 14.0, 12.0, 26.0, 32.0, 29.0, 16.0, 36.0, 45.0, 29.0, 33.0, 50.0, 38.0, 48.0, 36.0, 33.0, 36.0, 28.0, 27.0, 36.0, 29.0, 28.0, 22.0, 18.0, 23.0, 22.0, 23.0, 14.0, 16.0, 16.0, 15.0, 14.0, 13.0, 9.0, 4.0, 6.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0], "bins": [-6.529906272888184, -6.333456039428711, -6.137005805969238, -5.940556049346924, -5.744105815887451, -5.5476555824279785, -5.351205825805664, -5.154755592346191, -4.958305358886719, -4.761855125427246, -4.565404891967773, -4.368955135345459, -4.172504901885986, -3.9760546684265137, -3.77960467338562, -3.5831546783447266, -3.386704444885254, -3.1902542114257812, -2.9938042163848877, -2.797354221343994, -2.6009039878845215, -2.404453754425049, -2.2080037593841553, -2.0115537643432617, -1.815103530883789, -1.618653416633606, -1.4222033023834229, -1.2257531881332397, -1.0293030738830566, -0.8328529596328735, -0.6364028453826904, -0.4399527311325073, -0.24350214004516602, -0.04705202579498291, 0.1493980884552002, 0.3458482027053833, 0.5422983169555664, 0.7387484312057495, 0.9351985454559326, 1.1316486597061157, 1.3280987739562988, 1.524548888206482, 1.720999002456665, 1.9174491167068481, 2.1138992309570312, 2.310349464416504, 2.5067994594573975, 2.703249454498291, 2.8996996879577637, 3.0961499214172363, 3.29259991645813, 3.4890499114990234, 3.685500144958496, 3.8819503784179688, 4.078400611877441, 4.274850368499756, 4.4713006019592285, 4.667750835418701, 4.864200592041016, 5.060650825500488, 5.257101058959961, 5.453551292419434, 5.650001525878906, 5.846451282501221, 6.042901515960693]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 17.0, 19.0, 33.0, 57.0, 102.0, 130.0, 190.0, 302.0, 402.0, 669.0, 985.0, 1468.0, 2305.0, 3414.0, 5241.0, 8282.0, 12982.0, 20629.0, 34605.0, 62382.0, 119319.0, 211202.0, 233551.0, 146800.0, 76003.0, 41343.0, 24060.0, 14887.0, 9589.0, 6146.0, 3970.0, 2625.0, 1638.0, 1038.0, 726.0, 487.0, 303.0, 201.0, 155.0, 99.0, 57.0, 51.0, 25.0, 15.0, 10.0, 5.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2294921875, -1.188720703125, -1.14794921875, -1.107177734375, -1.06640625, -1.025634765625, -0.98486328125, -0.944091796875, -0.9033203125, -0.862548828125, -0.82177734375, -0.781005859375, -0.740234375, -0.699462890625, -0.65869140625, -0.617919921875, -0.5771484375, -0.536376953125, -0.49560546875, -0.454833984375, -0.4140625, -0.373291015625, -0.33251953125, -0.291748046875, -0.2509765625, -0.210205078125, -0.16943359375, -0.128662109375, -0.087890625, -0.047119140625, -0.00634765625, 0.034423828125, 0.0751953125, 0.115966796875, 0.15673828125, 0.197509765625, 0.23828125, 0.279052734375, 0.31982421875, 0.360595703125, 0.4013671875, 0.442138671875, 0.48291015625, 0.523681640625, 0.564453125, 0.605224609375, 0.64599609375, 0.686767578125, 0.7275390625, 0.768310546875, 0.80908203125, 0.849853515625, 0.890625, 0.931396484375, 0.97216796875, 1.012939453125, 1.0537109375, 1.094482421875, 1.13525390625, 1.176025390625, 1.216796875, 1.257568359375, 1.29833984375, 1.339111328125, 1.3798828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 11.0, 11.0, 15.0, 17.0, 13.0, 19.0, 16.0, 26.0, 35.0, 37.0, 43.0, 42.0, 41.0, 56.0, 46.0, 40.0, 47.0, 45.0, 48.0, 43.0, 34.0, 36.0, 44.0, 25.0, 28.0, 26.0, 27.0, 14.0, 16.0, 17.0, 14.0, 10.0, 7.0, 8.0, 4.0, 12.0, 3.0, 5.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.267578125, -1.23101806640625, -1.1944580078125, -1.15789794921875, -1.121337890625, -1.08477783203125, -1.0482177734375, -1.01165771484375, -0.97509765625, -0.93853759765625, -0.9019775390625, -0.86541748046875, -0.828857421875, -0.79229736328125, -0.7557373046875, -0.71917724609375, -0.6826171875, -0.64605712890625, -0.6094970703125, -0.57293701171875, -0.536376953125, -0.49981689453125, -0.4632568359375, -0.42669677734375, -0.39013671875, -0.35357666015625, -0.3170166015625, -0.28045654296875, -0.243896484375, -0.20733642578125, -0.1707763671875, -0.13421630859375, -0.09765625, -0.06109619140625, -0.0245361328125, 0.01202392578125, 0.048583984375, 0.08514404296875, 0.1217041015625, 0.15826416015625, 0.19482421875, 0.23138427734375, 0.2679443359375, 0.30450439453125, 0.341064453125, 0.37762451171875, 0.4141845703125, 0.45074462890625, 0.4873046875, 0.52386474609375, 0.5604248046875, 0.59698486328125, 0.633544921875, 0.67010498046875, 0.7066650390625, 0.74322509765625, 0.77978515625, 0.81634521484375, 0.8529052734375, 0.88946533203125, 0.926025390625, 0.96258544921875, 0.9991455078125, 1.03570556640625, 1.072265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 14.0, 13.0, 13.0, 13.0, 26.0, 23.0, 37.0, 61.0, 107.0, 261.0, 625.0, 1753.0, 5108.0, 18257.0, 80114.0, 519118.0, 350411.0, 53164.0, 13235.0, 3896.0, 1343.0, 463.0, 179.0, 94.0, 51.0, 28.0, 18.0, 23.0, 23.0, 14.0, 7.0, 7.0, 9.0, 8.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.20684814453125, -4.0660400390625, -3.92523193359375, -3.784423828125, -3.64361572265625, -3.5028076171875, -3.36199951171875, -3.22119140625, -3.08038330078125, -2.9395751953125, -2.79876708984375, -2.657958984375, -2.51715087890625, -2.3763427734375, -2.23553466796875, -2.0947265625, -1.95391845703125, -1.8131103515625, -1.67230224609375, -1.531494140625, -1.39068603515625, -1.2498779296875, -1.10906982421875, -0.96826171875, -0.82745361328125, -0.6866455078125, -0.54583740234375, -0.405029296875, -0.26422119140625, -0.1234130859375, 0.01739501953125, 0.158203125, 0.29901123046875, 0.4398193359375, 0.58062744140625, 0.721435546875, 0.86224365234375, 1.0030517578125, 1.14385986328125, 1.28466796875, 1.42547607421875, 1.5662841796875, 1.70709228515625, 1.847900390625, 1.98870849609375, 2.1295166015625, 2.27032470703125, 2.4111328125, 2.55194091796875, 2.6927490234375, 2.83355712890625, 2.974365234375, 3.11517333984375, 3.2559814453125, 3.39678955078125, 3.53759765625, 3.67840576171875, 3.8192138671875, 3.96002197265625, 4.100830078125, 4.24163818359375, 4.3824462890625, 4.52325439453125, 4.6640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 12.0, 12.0, 21.0, 22.0, 20.0, 33.0, 31.0, 35.0, 45.0, 49.0, 42.0, 41.0, 56.0, 55.0, 42.0, 48.0, 43.0, 49.0, 50.0, 48.0, 37.0, 29.0, 27.0, 21.0, 22.0, 14.0, 10.0, 11.0, 11.0, 10.0, 4.0, 6.0, 6.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.724609375, -3.6060791015625, -3.487548828125, -3.3690185546875, -3.25048828125, -3.1319580078125, -3.013427734375, -2.8948974609375, -2.7763671875, -2.6578369140625, -2.539306640625, -2.4207763671875, -2.30224609375, -2.1837158203125, -2.065185546875, -1.9466552734375, -1.828125, -1.7095947265625, -1.591064453125, -1.4725341796875, -1.35400390625, -1.2354736328125, -1.116943359375, -0.9984130859375, -0.8798828125, -0.7613525390625, -0.642822265625, -0.5242919921875, -0.40576171875, -0.2872314453125, -0.168701171875, -0.0501708984375, 0.068359375, 0.1868896484375, 0.305419921875, 0.4239501953125, 0.54248046875, 0.6610107421875, 0.779541015625, 0.8980712890625, 1.0166015625, 1.1351318359375, 1.253662109375, 1.3721923828125, 1.49072265625, 1.6092529296875, 1.727783203125, 1.8463134765625, 1.96484375, 2.0833740234375, 2.201904296875, 2.3204345703125, 2.43896484375, 2.5574951171875, 2.676025390625, 2.7945556640625, 2.9130859375, 3.0316162109375, 3.150146484375, 3.2686767578125, 3.38720703125, 3.5057373046875, 3.624267578125, 3.7427978515625, 3.861328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 12.0, 8.0, 10.0, 17.0, 33.0, 26.0, 32.0, 54.0, 71.0, 94.0, 136.0, 206.0, 318.0, 491.0, 779.0, 1464.0, 3167.0, 7598.0, 21761.0, 67224.0, 274058.0, 488721.0, 123806.0, 36410.0, 12399.0, 4655.0, 2134.0, 1026.0, 590.0, 387.0, 231.0, 174.0, 130.0, 89.0, 62.0, 49.0, 29.0, 23.0, 21.0, 11.0, 15.0, 8.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7216796875, -1.66656494140625, -1.6114501953125, -1.55633544921875, -1.501220703125, -1.44610595703125, -1.3909912109375, -1.33587646484375, -1.28076171875, -1.22564697265625, -1.1705322265625, -1.11541748046875, -1.060302734375, -1.00518798828125, -0.9500732421875, -0.89495849609375, -0.83984375, -0.78472900390625, -0.7296142578125, -0.67449951171875, -0.619384765625, -0.56427001953125, -0.5091552734375, -0.45404052734375, -0.39892578125, -0.34381103515625, -0.2886962890625, -0.23358154296875, -0.178466796875, -0.12335205078125, -0.0682373046875, -0.01312255859375, 0.0419921875, 0.09710693359375, 0.1522216796875, 0.20733642578125, 0.262451171875, 0.31756591796875, 0.3726806640625, 0.42779541015625, 0.48291015625, 0.53802490234375, 0.5931396484375, 0.64825439453125, 0.703369140625, 0.75848388671875, 0.8135986328125, 0.86871337890625, 0.923828125, 0.97894287109375, 1.0340576171875, 1.08917236328125, 1.144287109375, 1.19940185546875, 1.2545166015625, 1.30963134765625, 1.36474609375, 1.41986083984375, 1.4749755859375, 1.53009033203125, 1.585205078125, 1.64031982421875, 1.6954345703125, 1.75054931640625, 1.8056640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 5.0, 5.0, 12.0, 12.0, 8.0, 23.0, 35.0, 27.0, 64.0, 118.0, 188.0, 171.0, 119.0, 78.0, 38.0, 35.0, 22.0, 16.0, 8.0, 10.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0005817413330078125, -0.0005691144615411758, -0.0005564875900745392, -0.0005438607186079025, -0.0005312338471412659, -0.0005186069756746292, -0.0005059801042079926, -0.0004933532327413559, -0.00048072636127471924, -0.0004680994898080826, -0.0004554726183414459, -0.00044284574687480927, -0.0004302188754081726, -0.00041759200394153595, -0.0004049651324748993, -0.00039233826100826263, -0.000379711389541626, -0.0003670845180749893, -0.00035445764660835266, -0.000341830775141716, -0.00032920390367507935, -0.0003165770322084427, -0.00030395016074180603, -0.00029132328927516937, -0.0002786964178085327, -0.00026606954634189606, -0.0002534426748752594, -0.00024081580340862274, -0.00022818893194198608, -0.00021556206047534943, -0.00020293518900871277, -0.0001903083175420761, -0.00017768144607543945, -0.0001650545746088028, -0.00015242770314216614, -0.00013980083167552948, -0.00012717396020889282, -0.00011454708874225616, -0.00010192021727561951, -8.929334580898285e-05, -7.666647434234619e-05, -6.403960287570953e-05, -5.1412731409072876e-05, -3.878585994243622e-05, -2.615898847579956e-05, -1.3532117009162903e-05, -9.052455425262451e-07, 1.1721625924110413e-05, 2.434849739074707e-05, 3.697536885738373e-05, 4.9602240324020386e-05, 6.222911179065704e-05, 7.48559832572937e-05, 8.748285472393036e-05, 0.00010010972619056702, 0.00011273659765720367, 0.00012536346912384033, 0.000137990340590477, 0.00015061721205711365, 0.0001632440835237503, 0.00017587095499038696, 0.00018849782645702362, 0.00020112469792366028, 0.00021375156939029694, 0.0002263784408569336]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 7.0, 8.0, 11.0, 9.0, 12.0, 17.0, 23.0, 32.0, 43.0, 89.0, 82.0, 122.0, 218.0, 362.0, 626.0, 1098.0, 2084.0, 4228.0, 9330.0, 22092.0, 56180.0, 167631.0, 450709.0, 216636.0, 68792.0, 26621.0, 11105.0, 4917.0, 2408.0, 1251.0, 644.0, 380.0, 248.0, 159.0, 116.0, 72.0, 50.0, 34.0, 23.0, 23.0, 15.0, 16.0, 12.0, 4.0, 6.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3125, -1.2696075439453125, -1.226715087890625, -1.1838226318359375, -1.14093017578125, -1.0980377197265625, -1.055145263671875, -1.0122528076171875, -0.9693603515625, -0.9264678955078125, -0.883575439453125, -0.8406829833984375, -0.79779052734375, -0.7548980712890625, -0.712005615234375, -0.6691131591796875, -0.626220703125, -0.5833282470703125, -0.540435791015625, -0.4975433349609375, -0.45465087890625, -0.4117584228515625, -0.368865966796875, -0.3259735107421875, -0.2830810546875, -0.2401885986328125, -0.197296142578125, -0.1544036865234375, -0.11151123046875, -0.0686187744140625, -0.025726318359375, 0.0171661376953125, 0.06005859375, 0.1029510498046875, 0.145843505859375, 0.1887359619140625, 0.23162841796875, 0.2745208740234375, 0.317413330078125, 0.3603057861328125, 0.4031982421875, 0.4460906982421875, 0.488983154296875, 0.5318756103515625, 0.57476806640625, 0.6176605224609375, 0.660552978515625, 0.7034454345703125, 0.746337890625, 0.7892303466796875, 0.832122802734375, 0.8750152587890625, 0.91790771484375, 0.9608001708984375, 1.003692626953125, 1.0465850830078125, 1.0894775390625, 1.1323699951171875, 1.175262451171875, 1.2181549072265625, 1.26104736328125, 1.3039398193359375, 1.346832275390625, 1.3897247314453125, 1.4326171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 2.0, 8.0, 9.0, 11.0, 17.0, 13.0, 28.0, 20.0, 38.0, 39.0, 67.0, 84.0, 105.0, 108.0, 106.0, 88.0, 50.0, 44.0, 35.0, 29.0, 19.0, 15.0, 8.0, 11.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.2639007568359375, -1.225067138671875, -1.1862335205078125, -1.14739990234375, -1.1085662841796875, -1.069732666015625, -1.0308990478515625, -0.9920654296875, -0.9532318115234375, -0.914398193359375, -0.8755645751953125, -0.83673095703125, -0.7978973388671875, -0.759063720703125, -0.7202301025390625, -0.681396484375, -0.6425628662109375, -0.603729248046875, -0.5648956298828125, -0.52606201171875, -0.4872283935546875, -0.448394775390625, -0.4095611572265625, -0.3707275390625, -0.3318939208984375, -0.293060302734375, -0.2542266845703125, -0.21539306640625, -0.1765594482421875, -0.137725830078125, -0.0988922119140625, -0.06005859375, -0.0212249755859375, 0.017608642578125, 0.0564422607421875, 0.09527587890625, 0.1341094970703125, 0.172943115234375, 0.2117767333984375, 0.2506103515625, 0.2894439697265625, 0.328277587890625, 0.3671112060546875, 0.40594482421875, 0.4447784423828125, 0.483612060546875, 0.5224456787109375, 0.561279296875, 0.6001129150390625, 0.638946533203125, 0.6777801513671875, 0.71661376953125, 0.7554473876953125, 0.794281005859375, 0.8331146240234375, 0.8719482421875, 0.9107818603515625, 0.949615478515625, 0.9884490966796875, 1.02728271484375, 1.0661163330078125, 1.104949951171875, 1.1437835693359375, 1.1826171875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 18.0, 34.0, 55.0, 97.0, 103.0, 142.0, 153.0, 135.0, 94.0, 72.0, 41.0, 30.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.198183059692383, -18.63956642150879, -18.080949783325195, -17.5223331451416, -16.963716506958008, -16.405101776123047, -15.846484184265137, -15.287867546081543, -14.729251861572266, -14.170635223388672, -13.612018585205078, -13.053401947021484, -12.494786262512207, -11.936169624328613, -11.37755298614502, -10.818936347961426, -10.260319709777832, -9.701703071594238, -9.143086433410645, -8.584470748901367, -8.025854110717773, -7.46723747253418, -6.908620834350586, -6.350004196166992, -5.791388034820557, -5.232771396636963, -4.674155235290527, -4.115538597106934, -3.556922197341919, -2.9983057975769043, -2.4396891593933105, -1.881072759628296, -1.3224563598632812, -0.7638399004936218, -0.2052234411239624, 0.3533930778503418, 0.9120094776153564, 1.470625877380371, 2.029242515563965, 2.5878589153289795, 3.146475315093994, 3.705091714859009, 4.263708114624023, 4.822324752807617, 5.380941390991211, 5.9395575523376465, 6.49817419052124, 7.056790351867676, 7.6154069900512695, 8.174023628234863, 8.732640266418457, 9.291255950927734, 9.849872589111328, 10.408489227294922, 10.967105865478516, 11.52572250366211, 12.084339141845703, 12.642955780029297, 13.20157241821289, 13.760189056396484, 14.318804740905762, 14.877421379089355, 15.43603801727295, 15.994654655456543, 16.55327033996582]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 8.0, 9.0, 8.0, 8.0, 10.0, 19.0, 18.0, 22.0, 22.0, 27.0, 30.0, 41.0, 26.0, 32.0, 36.0, 50.0, 37.0, 39.0, 32.0, 40.0, 42.0, 38.0, 33.0, 42.0, 25.0, 28.0, 33.0, 27.0, 28.0, 26.0, 26.0, 15.0, 16.0, 15.0, 10.0, 17.0, 7.0, 6.0, 12.0, 10.0, 6.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.37156867980957, -9.097650527954102, -8.823732376098633, -8.54981517791748, -8.275897026062012, -8.001978874206543, -7.728060722351074, -7.4541425704956055, -7.180224895477295, -6.906306743621826, -6.632389068603516, -6.358470916748047, -6.084552764892578, -5.810635089874268, -5.536716938018799, -5.262799263000488, -4.9888811111450195, -4.714962959289551, -4.44104528427124, -4.1671271324157715, -3.893209218978882, -3.619291305541992, -3.3453731536865234, -3.071455240249634, -2.797537326812744, -2.5236194133758545, -2.249701499938965, -1.975783348083496, -1.7018654346466064, -1.4279475212097168, -1.1540294885635376, -0.8801114559173584, -0.6061944961547852, -0.33227652311325073, -0.05835855007171631, 0.21555942296981812, 0.48947739601135254, 0.7633953094482422, 1.0373133420944214, 1.3112313747406006, 1.5851492881774902, 1.8590672016143799, 2.1329851150512695, 2.4069032669067383, 2.680821180343628, 2.9547390937805176, 3.2286572456359863, 3.502575159072876, 3.7764930725097656, 4.050411224365234, 4.324328899383545, 4.598247051239014, 4.872164726257324, 5.146082878112793, 5.420001029968262, 5.6939191818237305, 5.967836856842041, 6.24175500869751, 6.51567268371582, 6.789590835571289, 7.063508987426758, 7.337426662445068, 7.611344814300537, 7.885262489318848, 8.159180641174316]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 12.0, 18.0, 25.0, 26.0, 51.0, 70.0, 101.0, 169.0, 314.0, 486.0, 818.0, 1404.0, 2627.0, 5059.0, 10714.0, 23999.0, 59414.0, 170632.0, 645969.0, 2336788.0, 654909.0, 174114.0, 60732.0, 24413.0, 10536.0, 4957.0, 2518.0, 1422.0, 747.0, 461.0, 271.0, 165.0, 101.0, 57.0, 40.0, 33.0, 20.0, 20.0, 12.0, 11.0, 7.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.322265625, -2.250823974609375, -2.17938232421875, -2.107940673828125, -2.0364990234375, -1.965057373046875, -1.89361572265625, -1.822174072265625, -1.750732421875, -1.679290771484375, -1.60784912109375, -1.536407470703125, -1.4649658203125, -1.393524169921875, -1.32208251953125, -1.250640869140625, -1.17919921875, -1.107757568359375, -1.03631591796875, -0.964874267578125, -0.8934326171875, -0.821990966796875, -0.75054931640625, -0.679107666015625, -0.607666015625, -0.536224365234375, -0.46478271484375, -0.393341064453125, -0.3218994140625, -0.250457763671875, -0.17901611328125, -0.107574462890625, -0.0361328125, 0.035308837890625, 0.10675048828125, 0.178192138671875, 0.2496337890625, 0.321075439453125, 0.39251708984375, 0.463958740234375, 0.535400390625, 0.606842041015625, 0.67828369140625, 0.749725341796875, 0.8211669921875, 0.892608642578125, 0.96405029296875, 1.035491943359375, 1.10693359375, 1.178375244140625, 1.24981689453125, 1.321258544921875, 1.3927001953125, 1.464141845703125, 1.53558349609375, 1.607025146484375, 1.678466796875, 1.749908447265625, 1.82135009765625, 1.892791748046875, 1.9642333984375, 2.035675048828125, 2.10711669921875, 2.178558349609375, 2.25]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 2.0, 3.0, 8.0, 14.0, 9.0, 12.0, 17.0, 17.0, 18.0, 32.0, 34.0, 31.0, 28.0, 35.0, 40.0, 36.0, 43.0, 42.0, 34.0, 48.0, 43.0, 51.0, 35.0, 46.0, 39.0, 35.0, 34.0, 33.0, 37.0, 23.0, 23.0, 15.0, 20.0, 17.0, 8.0, 5.0, 5.0, 5.0, 4.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1904296875, -1.1539306640625, -1.117431640625, -1.0809326171875, -1.04443359375, -1.0079345703125, -0.971435546875, -0.9349365234375, -0.8984375, -0.8619384765625, -0.825439453125, -0.7889404296875, -0.75244140625, -0.7159423828125, -0.679443359375, -0.6429443359375, -0.6064453125, -0.5699462890625, -0.533447265625, -0.4969482421875, -0.46044921875, -0.4239501953125, -0.387451171875, -0.3509521484375, -0.314453125, -0.2779541015625, -0.241455078125, -0.2049560546875, -0.16845703125, -0.1319580078125, -0.095458984375, -0.0589599609375, -0.0224609375, 0.0140380859375, 0.050537109375, 0.0870361328125, 0.12353515625, 0.1600341796875, 0.196533203125, 0.2330322265625, 0.26953125, 0.3060302734375, 0.342529296875, 0.3790283203125, 0.41552734375, 0.4520263671875, 0.488525390625, 0.5250244140625, 0.5615234375, 0.5980224609375, 0.634521484375, 0.6710205078125, 0.70751953125, 0.7440185546875, 0.780517578125, 0.8170166015625, 0.853515625, 0.8900146484375, 0.926513671875, 0.9630126953125, 0.99951171875, 1.0360107421875, 1.072509765625, 1.1090087890625, 1.1455078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 8.0, 16.0, 17.0, 15.0, 28.0, 39.0, 42.0, 55.0, 77.0, 127.0, 182.0, 264.0, 485.0, 851.0, 1714.0, 3660.0, 8697.0, 24233.0, 80693.0, 355768.0, 2442464.0, 1029633.0, 173500.0, 45314.0, 14942.0, 5832.0, 2585.0, 1243.0, 663.0, 368.0, 233.0, 164.0, 111.0, 64.0, 61.0, 31.0, 27.0, 16.0, 17.0, 10.0, 8.0, 8.0, 5.0, 3.0, 1.0, 4.0, 5.0, 1.0], "bins": [-4.875, -4.742431640625, -4.60986328125, -4.477294921875, -4.3447265625, -4.212158203125, -4.07958984375, -3.947021484375, -3.814453125, -3.681884765625, -3.54931640625, -3.416748046875, -3.2841796875, -3.151611328125, -3.01904296875, -2.886474609375, -2.75390625, -2.621337890625, -2.48876953125, -2.356201171875, -2.2236328125, -2.091064453125, -1.95849609375, -1.825927734375, -1.693359375, -1.560791015625, -1.42822265625, -1.295654296875, -1.1630859375, -1.030517578125, -0.89794921875, -0.765380859375, -0.6328125, -0.500244140625, -0.36767578125, -0.235107421875, -0.1025390625, 0.030029296875, 0.16259765625, 0.295166015625, 0.427734375, 0.560302734375, 0.69287109375, 0.825439453125, 0.9580078125, 1.090576171875, 1.22314453125, 1.355712890625, 1.48828125, 1.620849609375, 1.75341796875, 1.885986328125, 2.0185546875, 2.151123046875, 2.28369140625, 2.416259765625, 2.548828125, 2.681396484375, 2.81396484375, 2.946533203125, 3.0791015625, 3.211669921875, 3.34423828125, 3.476806640625, 3.609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 18.0, 28.0, 42.0, 71.0, 62.0, 124.0, 222.0, 338.0, 617.0, 948.0, 615.0, 363.0, 221.0, 129.0, 76.0, 53.0, 31.0, 36.0, 13.0, 18.0, 11.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.941162109375, -3.81201171875, -3.682861328125, -3.5537109375, -3.424560546875, -3.29541015625, -3.166259765625, -3.037109375, -2.907958984375, -2.77880859375, -2.649658203125, -2.5205078125, -2.391357421875, -2.26220703125, -2.133056640625, -2.00390625, -1.874755859375, -1.74560546875, -1.616455078125, -1.4873046875, -1.358154296875, -1.22900390625, -1.099853515625, -0.970703125, -0.841552734375, -0.71240234375, -0.583251953125, -0.4541015625, -0.324951171875, -0.19580078125, -0.066650390625, 0.0625, 0.191650390625, 0.32080078125, 0.449951171875, 0.5791015625, 0.708251953125, 0.83740234375, 0.966552734375, 1.095703125, 1.224853515625, 1.35400390625, 1.483154296875, 1.6123046875, 1.741455078125, 1.87060546875, 1.999755859375, 2.12890625, 2.258056640625, 2.38720703125, 2.516357421875, 2.6455078125, 2.774658203125, 2.90380859375, 3.032958984375, 3.162109375, 3.291259765625, 3.42041015625, 3.549560546875, 3.6787109375, 3.807861328125, 3.93701171875, 4.066162109375, 4.1953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 8.0, 3.0, 8.0, 17.0, 24.0, 31.0, 34.0, 35.0, 34.0, 48.0, 52.0, 64.0, 56.0, 70.0, 76.0, 59.0, 55.0, 48.0, 41.0, 37.0, 38.0, 32.0, 20.0, 18.0, 13.0, 11.0, 17.0, 8.0, 10.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.299647331237793, -10.990974426269531, -10.682300567626953, -10.373627662658691, -10.06495475769043, -9.756280899047852, -9.44760799407959, -9.138935089111328, -8.83026123046875, -8.521588325500488, -8.21291446685791, -7.904241561889648, -7.5955681800842285, -7.286894798278809, -6.978221893310547, -6.669548511505127, -6.360875606536865, -6.052202224731445, -5.743529319763184, -5.434855937957764, -5.126182556152344, -4.817509651184082, -4.508836269378662, -4.200162887573242, -3.8914897441864014, -3.5828166007995605, -3.2741432189941406, -2.9654700756073, -2.656796932220459, -2.348123550415039, -2.0394504070281982, -1.7307770252227783, -1.4221038818359375, -1.1134306192398071, -0.8047574162483215, -0.49608421325683594, -0.18741095066070557, 0.1212623119354248, 0.4299354553222656, 0.7386088371276855, 1.0472819805145264, 1.3559552431106567, 1.664628505706787, 1.973301649093628, 2.2819747924804688, 2.5906481742858887, 2.8993213176727295, 3.2079946994781494, 3.5166678428649902, 3.825340986251831, 4.134014129638672, 4.442687511444092, 4.751360893249512, 5.060033798217773, 5.368707180023193, 5.677380561828613, 5.986053466796875, 6.294726848602295, 6.603399753570557, 6.912073135375977, 7.2207465171813965, 7.529419898986816, 7.838092803955078, 8.146766662597656, 8.455439567565918]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 4.0, 14.0, 11.0, 16.0, 19.0, 18.0, 15.0, 17.0, 20.0, 19.0, 21.0, 23.0, 32.0, 37.0, 27.0, 24.0, 27.0, 36.0, 35.0, 36.0, 32.0, 26.0, 28.0, 32.0, 38.0, 35.0, 36.0, 23.0, 23.0, 24.0, 30.0, 30.0, 11.0, 21.0, 25.0, 18.0, 11.0, 22.0, 14.0, 6.0, 6.0, 7.0, 5.0, 9.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.652467727661133, -7.411046504974365, -7.1696248054504395, -6.928203582763672, -6.686781883239746, -6.4453606605529785, -6.203939437866211, -5.962517738342285, -5.721096038818359, -5.479674816131592, -5.238253116607666, -4.996831893920898, -4.755410194396973, -4.513988971710205, -4.2725677490234375, -4.031146049499512, -3.789724826812744, -3.5483033657073975, -3.306881904602051, -3.065460681915283, -2.8240389823913574, -2.58261775970459, -2.341196298599243, -2.0997748374938965, -1.8583533763885498, -1.6169319152832031, -1.3755104541778564, -1.1340891122817993, -0.8926676511764526, -0.651246190071106, -0.40982484817504883, -0.16840338706970215, 0.07301759719848633, 0.3144390285015106, 0.5558604598045349, 0.7972818613052368, 1.0387033224105835, 1.2801247835159302, 1.5215461254119873, 1.762967586517334, 2.0043890476226807, 2.2458105087280273, 2.487231969833374, 2.7286534309387207, 2.9700746536254883, 3.211496353149414, 3.4529175758361816, 3.6943390369415283, 3.935760498046875, 4.177181720733643, 4.418603420257568, 4.660024642944336, 4.901446342468262, 5.142867565155029, 5.384288787841797, 5.625710487365723, 5.867132186889648, 6.108553409576416, 6.349975109100342, 6.591396331787109, 6.832818031311035, 7.074239253997803, 7.31566047668457, 7.557082176208496, 7.798503398895264]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 21.0, 23.0, 37.0, 59.0, 113.0, 137.0, 244.0, 416.0, 646.0, 1159.0, 2089.0, 3633.0, 6429.0, 11315.0, 20205.0, 38265.0, 80960.0, 201620.0, 349725.0, 179725.0, 72945.0, 35818.0, 18762.0, 10522.0, 5836.0, 3357.0, 1852.0, 1032.0, 623.0, 330.0, 251.0, 150.0, 70.0, 67.0, 42.0, 16.0, 17.0, 14.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.396209716796875, -2.31195068359375, -2.227691650390625, -2.1434326171875, -2.059173583984375, -1.97491455078125, -1.890655517578125, -1.806396484375, -1.722137451171875, -1.63787841796875, -1.553619384765625, -1.4693603515625, -1.385101318359375, -1.30084228515625, -1.216583251953125, -1.13232421875, -1.048065185546875, -0.96380615234375, -0.879547119140625, -0.7952880859375, -0.711029052734375, -0.62677001953125, -0.542510986328125, -0.458251953125, -0.373992919921875, -0.28973388671875, -0.205474853515625, -0.1212158203125, -0.036956787109375, 0.04730224609375, 0.131561279296875, 0.2158203125, 0.300079345703125, 0.38433837890625, 0.468597412109375, 0.5528564453125, 0.637115478515625, 0.72137451171875, 0.805633544921875, 0.889892578125, 0.974151611328125, 1.05841064453125, 1.142669677734375, 1.2269287109375, 1.311187744140625, 1.39544677734375, 1.479705810546875, 1.56396484375, 1.648223876953125, 1.73248291015625, 1.816741943359375, 1.9010009765625, 1.985260009765625, 2.06951904296875, 2.153778076171875, 2.238037109375, 2.322296142578125, 2.40655517578125, 2.490814208984375, 2.5750732421875, 2.659332275390625, 2.74359130859375, 2.827850341796875, 2.912109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 7.0, 9.0, 22.0, 9.0, 21.0, 21.0, 15.0, 25.0, 35.0, 25.0, 41.0, 44.0, 42.0, 48.0, 40.0, 52.0, 51.0, 36.0, 53.0, 40.0, 44.0, 34.0, 37.0, 30.0, 28.0, 30.0, 23.0, 19.0, 16.0, 10.0, 13.0, 15.0, 10.0, 12.0, 4.0, 11.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.33984375, -1.29876708984375, -1.2576904296875, -1.21661376953125, -1.175537109375, -1.13446044921875, -1.0933837890625, -1.05230712890625, -1.01123046875, -0.97015380859375, -0.9290771484375, -0.88800048828125, -0.846923828125, -0.80584716796875, -0.7647705078125, -0.72369384765625, -0.6826171875, -0.64154052734375, -0.6004638671875, -0.55938720703125, -0.518310546875, -0.47723388671875, -0.4361572265625, -0.39508056640625, -0.35400390625, -0.31292724609375, -0.2718505859375, -0.23077392578125, -0.189697265625, -0.14862060546875, -0.1075439453125, -0.06646728515625, -0.025390625, 0.01568603515625, 0.0567626953125, 0.09783935546875, 0.138916015625, 0.17999267578125, 0.2210693359375, 0.26214599609375, 0.30322265625, 0.34429931640625, 0.3853759765625, 0.42645263671875, 0.467529296875, 0.50860595703125, 0.5496826171875, 0.59075927734375, 0.6318359375, 0.67291259765625, 0.7139892578125, 0.75506591796875, 0.796142578125, 0.83721923828125, 0.8782958984375, 0.91937255859375, 0.96044921875, 1.00152587890625, 1.0426025390625, 1.08367919921875, 1.124755859375, 1.16583251953125, 1.2069091796875, 1.24798583984375, 1.2890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 11.0, 18.0, 25.0, 41.0, 30.0, 63.0, 94.0, 212.0, 279.0, 520.0, 1003.0, 1968.0, 4332.0, 9609.0, 21189.0, 47134.0, 118697.0, 341130.0, 314858.0, 107360.0, 43594.0, 19502.0, 8996.0, 3913.0, 1854.0, 930.0, 486.0, 263.0, 154.0, 94.0, 60.0, 43.0, 20.0, 21.0, 12.0, 9.0, 10.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65625, -2.55389404296875, -2.4515380859375, -2.34918212890625, -2.246826171875, -2.14447021484375, -2.0421142578125, -1.93975830078125, -1.83740234375, -1.73504638671875, -1.6326904296875, -1.53033447265625, -1.427978515625, -1.32562255859375, -1.2232666015625, -1.12091064453125, -1.0185546875, -0.91619873046875, -0.8138427734375, -0.71148681640625, -0.609130859375, -0.50677490234375, -0.4044189453125, -0.30206298828125, -0.19970703125, -0.09735107421875, 0.0050048828125, 0.10736083984375, 0.209716796875, 0.31207275390625, 0.4144287109375, 0.51678466796875, 0.619140625, 0.72149658203125, 0.8238525390625, 0.92620849609375, 1.028564453125, 1.13092041015625, 1.2332763671875, 1.33563232421875, 1.43798828125, 1.54034423828125, 1.6427001953125, 1.74505615234375, 1.847412109375, 1.94976806640625, 2.0521240234375, 2.15447998046875, 2.2568359375, 2.35919189453125, 2.4615478515625, 2.56390380859375, 2.666259765625, 2.76861572265625, 2.8709716796875, 2.97332763671875, 3.07568359375, 3.17803955078125, 3.2803955078125, 3.38275146484375, 3.485107421875, 3.58746337890625, 3.6898193359375, 3.79217529296875, 3.89453125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 3.0, 2.0, 3.0, 6.0, 6.0, 12.0, 9.0, 8.0, 23.0, 15.0, 27.0, 32.0, 20.0, 42.0, 27.0, 36.0, 38.0, 48.0, 47.0, 46.0, 50.0, 43.0, 34.0, 56.0, 37.0, 42.0, 34.0, 33.0, 30.0, 31.0, 30.0, 21.0, 18.0, 20.0, 15.0, 9.0, 14.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.796875, -4.65948486328125, -4.5220947265625, -4.38470458984375, -4.247314453125, -4.10992431640625, -3.9725341796875, -3.83514404296875, -3.69775390625, -3.56036376953125, -3.4229736328125, -3.28558349609375, -3.148193359375, -3.01080322265625, -2.8734130859375, -2.73602294921875, -2.5986328125, -2.46124267578125, -2.3238525390625, -2.18646240234375, -2.049072265625, -1.91168212890625, -1.7742919921875, -1.63690185546875, -1.49951171875, -1.36212158203125, -1.2247314453125, -1.08734130859375, -0.949951171875, -0.81256103515625, -0.6751708984375, -0.53778076171875, -0.400390625, -0.26300048828125, -0.1256103515625, 0.01177978515625, 0.149169921875, 0.28656005859375, 0.4239501953125, 0.56134033203125, 0.69873046875, 0.83612060546875, 0.9735107421875, 1.11090087890625, 1.248291015625, 1.38568115234375, 1.5230712890625, 1.66046142578125, 1.7978515625, 1.93524169921875, 2.0726318359375, 2.21002197265625, 2.347412109375, 2.48480224609375, 2.6221923828125, 2.75958251953125, 2.89697265625, 3.03436279296875, 3.1717529296875, 3.30914306640625, 3.446533203125, 3.58392333984375, 3.7213134765625, 3.85870361328125, 3.99609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 11.0, 16.0, 20.0, 21.0, 30.0, 56.0, 84.0, 91.0, 143.0, 221.0, 319.0, 559.0, 862.0, 1380.0, 2557.0, 4452.0, 7872.0, 14475.0, 26820.0, 49869.0, 99085.0, 206745.0, 294640.0, 165591.0, 80999.0, 41387.0, 22151.0, 12145.0, 6575.0, 3749.0, 2108.0, 1264.0, 789.0, 473.0, 357.0, 205.0, 153.0, 88.0, 54.0, 40.0, 21.0, 24.0, 11.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.1083984375, -1.075164794921875, -1.04193115234375, -1.008697509765625, -0.9754638671875, -0.942230224609375, -0.90899658203125, -0.875762939453125, -0.842529296875, -0.809295654296875, -0.77606201171875, -0.742828369140625, -0.7095947265625, -0.676361083984375, -0.64312744140625, -0.609893798828125, -0.57666015625, -0.543426513671875, -0.51019287109375, -0.476959228515625, -0.4437255859375, -0.410491943359375, -0.37725830078125, -0.344024658203125, -0.310791015625, -0.277557373046875, -0.24432373046875, -0.211090087890625, -0.1778564453125, -0.144622802734375, -0.11138916015625, -0.078155517578125, -0.044921875, -0.011688232421875, 0.02154541015625, 0.054779052734375, 0.0880126953125, 0.121246337890625, 0.15447998046875, 0.187713623046875, 0.220947265625, 0.254180908203125, 0.28741455078125, 0.320648193359375, 0.3538818359375, 0.387115478515625, 0.42034912109375, 0.453582763671875, 0.48681640625, 0.520050048828125, 0.55328369140625, 0.586517333984375, 0.6197509765625, 0.652984619140625, 0.68621826171875, 0.719451904296875, 0.752685546875, 0.785919189453125, 0.81915283203125, 0.852386474609375, 0.8856201171875, 0.918853759765625, 0.95208740234375, 0.985321044921875, 1.0185546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 10.0, 11.0, 15.0, 16.0, 24.0, 31.0, 41.0, 47.0, 93.0, 125.0, 113.0, 127.0, 84.0, 53.0, 40.0, 31.0, 27.0, 16.0, 15.0, 12.0, 10.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003561973571777344, -0.0003445148468017578, -0.00033283233642578125, -0.0003211498260498047, -0.0003094673156738281, -0.00029778480529785156, -0.000286102294921875, -0.00027441978454589844, -0.0002627372741699219, -0.0002510547637939453, -0.00023937225341796875, -0.0002276897430419922, -0.00021600723266601562, -0.00020432472229003906, -0.0001926422119140625, -0.00018095970153808594, -0.00016927719116210938, -0.0001575946807861328, -0.00014591217041015625, -0.0001342296600341797, -0.00012254714965820312, -0.00011086463928222656, -9.918212890625e-05, -8.749961853027344e-05, -7.581710815429688e-05, -6.413459777832031e-05, -5.245208740234375e-05, -4.076957702636719e-05, -2.9087066650390625e-05, -1.7404556274414062e-05, -5.7220458984375e-06, 5.9604644775390625e-06, 1.7642974853515625e-05, 2.9325485229492188e-05, 4.100799560546875e-05, 5.269050598144531e-05, 6.437301635742188e-05, 7.605552673339844e-05, 8.7738037109375e-05, 9.942054748535156e-05, 0.00011110305786132812, 0.0001227855682373047, 0.00013446807861328125, 0.0001461505889892578, 0.00015783309936523438, 0.00016951560974121094, 0.0001811981201171875, 0.00019288063049316406, 0.00020456314086914062, 0.0002162456512451172, 0.00022792816162109375, 0.0002396106719970703, 0.0002512931823730469, 0.00026297569274902344, 0.000274658203125, 0.00028634071350097656, 0.0002980232238769531, 0.0003097057342529297, 0.00032138824462890625, 0.0003330707550048828, 0.0003447532653808594, 0.00035643577575683594, 0.0003681182861328125, 0.00037980079650878906, 0.0003914833068847656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 10.0, 14.0, 25.0, 20.0, 37.0, 51.0, 78.0, 140.0, 232.0, 489.0, 932.0, 1858.0, 4521.0, 10885.0, 27781.0, 74780.0, 208217.0, 393055.0, 205208.0, 73793.0, 27449.0, 10700.0, 4477.0, 1853.0, 884.0, 418.0, 227.0, 122.0, 97.0, 48.0, 41.0, 32.0, 17.0, 12.0, 12.0, 7.0, 6.0, 2.0, 3.0, 6.0, 4.0, 0.0, 3.0, 3.0], "bins": [-1.7333984375, -1.687164306640625, -1.64093017578125, -1.594696044921875, -1.5484619140625, -1.502227783203125, -1.45599365234375, -1.409759521484375, -1.363525390625, -1.317291259765625, -1.27105712890625, -1.224822998046875, -1.1785888671875, -1.132354736328125, -1.08612060546875, -1.039886474609375, -0.99365234375, -0.947418212890625, -0.90118408203125, -0.854949951171875, -0.8087158203125, -0.762481689453125, -0.71624755859375, -0.670013427734375, -0.623779296875, -0.577545166015625, -0.53131103515625, -0.485076904296875, -0.4388427734375, -0.392608642578125, -0.34637451171875, -0.300140380859375, -0.25390625, -0.207672119140625, -0.16143798828125, -0.115203857421875, -0.0689697265625, -0.022735595703125, 0.02349853515625, 0.069732666015625, 0.115966796875, 0.162200927734375, 0.20843505859375, 0.254669189453125, 0.3009033203125, 0.347137451171875, 0.39337158203125, 0.439605712890625, 0.48583984375, 0.532073974609375, 0.57830810546875, 0.624542236328125, 0.6707763671875, 0.717010498046875, 0.76324462890625, 0.809478759765625, 0.855712890625, 0.901947021484375, 0.94818115234375, 0.994415283203125, 1.0406494140625, 1.086883544921875, 1.13311767578125, 1.179351806640625, 1.2255859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 0.0, 7.0, 5.0, 7.0, 4.0, 11.0, 21.0, 14.0, 20.0, 24.0, 30.0, 52.0, 69.0, 80.0, 105.0, 108.0, 100.0, 74.0, 60.0, 41.0, 39.0, 32.0, 18.0, 16.0, 13.0, 13.0, 10.0, 1.0, 4.0, 9.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8126068115234375, -1.762908935546875, -1.7132110595703125, -1.66351318359375, -1.6138153076171875, -1.564117431640625, -1.5144195556640625, -1.4647216796875, -1.4150238037109375, -1.365325927734375, -1.3156280517578125, -1.26593017578125, -1.2162322998046875, -1.166534423828125, -1.1168365478515625, -1.067138671875, -1.0174407958984375, -0.967742919921875, -0.9180450439453125, -0.86834716796875, -0.8186492919921875, -0.768951416015625, -0.7192535400390625, -0.6695556640625, -0.6198577880859375, -0.570159912109375, -0.5204620361328125, -0.47076416015625, -0.4210662841796875, -0.371368408203125, -0.3216705322265625, -0.27197265625, -0.2222747802734375, -0.172576904296875, -0.1228790283203125, -0.07318115234375, -0.0234832763671875, 0.026214599609375, 0.0759124755859375, 0.1256103515625, 0.1753082275390625, 0.225006103515625, 0.2747039794921875, 0.32440185546875, 0.3740997314453125, 0.423797607421875, 0.4734954833984375, 0.523193359375, 0.5728912353515625, 0.622589111328125, 0.6722869873046875, 0.72198486328125, 0.7716827392578125, 0.821380615234375, 0.8710784912109375, 0.9207763671875, 0.9704742431640625, 1.020172119140625, 1.0698699951171875, 1.11956787109375, 1.1692657470703125, 1.218963623046875, 1.2686614990234375, 1.318359375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 14.0, 4.0, 24.0, 37.0, 55.0, 69.0, 94.0, 100.0, 116.0, 104.0, 102.0, 89.0, 64.0, 48.0, 35.0, 21.0, 14.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.319637298583984, -21.731767654418945, -21.143896102905273, -20.556026458740234, -19.968154907226562, -19.380285263061523, -18.792415618896484, -18.204544067382812, -17.616674423217773, -17.028804779052734, -16.440933227539062, -15.853063583374023, -15.265192985534668, -14.677322387695312, -14.089452743530273, -13.501582145690918, -12.913711547851562, -12.325840950012207, -11.737970352172852, -11.150100708007812, -10.562230110168457, -9.974359512329102, -9.386489868164062, -8.798619270324707, -8.210748672485352, -7.622878074645996, -7.035007953643799, -6.447137832641602, -5.859267234802246, -5.271396636962891, -4.683526515960693, -4.095656394958496, -3.507783889770508, -2.9199135303497314, -2.332043170928955, -1.7441728115081787, -1.1563024520874023, -0.568432092666626, 0.01943826675415039, 0.6073083877563477, 1.1951789855957031, 1.7830493450164795, 2.370919704437256, 2.9587900638580322, 3.5466604232788086, 4.134531021118164, 4.722401142120361, 5.310271263122559, 5.898141860961914, 6.4860124588012695, 7.073882579803467, 7.661752700805664, 8.24962329864502, 8.837493896484375, 9.425363540649414, 10.01323413848877, 10.601104736328125, 11.18897533416748, 11.776845932006836, 12.364715576171875, 12.95258617401123, 13.540456771850586, 14.128326416015625, 14.71619701385498, 15.304067611694336]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 2.0, 6.0, 11.0, 8.0, 11.0, 17.0, 13.0, 18.0, 20.0, 21.0, 18.0, 28.0, 35.0, 35.0, 33.0, 32.0, 41.0, 40.0, 40.0, 53.0, 44.0, 45.0, 42.0, 38.0, 41.0, 40.0, 32.0, 35.0, 22.0, 27.0, 22.0, 20.0, 22.0, 21.0, 13.0, 12.0, 10.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0], "bins": [-13.945759773254395, -13.527469635009766, -13.109179496765137, -12.690889358520508, -12.272599220275879, -11.85430908203125, -11.436019897460938, -11.017728805541992, -10.59943962097168, -10.18114948272705, -9.762859344482422, -9.344569206237793, -8.926279067993164, -8.507988929748535, -8.089698791503906, -7.6714091300964355, -7.253118515014648, -6.8348283767700195, -6.416538238525391, -5.998248100280762, -5.579957962036133, -5.161667823791504, -4.743378162384033, -4.325088024139404, -3.9067978858947754, -3.4885077476501465, -3.0702176094055176, -2.6519277095794678, -2.233637571334839, -1.81534743309021, -1.3970575332641602, -0.9787673950195312, -0.5604782104492188, -0.14218813180923462, 0.2761019468307495, 0.6943919658660889, 1.1126821041107178, 1.5309722423553467, 1.9492621421813965, 2.3675522804260254, 2.7858424186706543, 3.204132556915283, 3.622422695159912, 4.040712356567383, 4.459002494812012, 4.877292633056641, 5.2955827713012695, 5.713872909545898, 6.132163047790527, 6.550453186035156, 6.968743324279785, 7.387033462524414, 7.805323600769043, 8.223613739013672, 8.641902923583984, 9.06019401550293, 9.478483200073242, 9.896773338317871, 10.3150634765625, 10.733353614807129, 11.151643753051758, 11.569933891296387, 11.988224029541016, 12.406513214111328, 12.824804306030273]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 10.0, 21.0, 21.0, 40.0, 45.0, 73.0, 107.0, 167.0, 240.0, 377.0, 592.0, 865.0, 1477.0, 2240.0, 3820.0, 6502.0, 11812.0, 22672.0, 45071.0, 96032.0, 229414.0, 697434.0, 1902582.0, 738526.0, 238225.0, 99636.0, 45729.0, 22525.0, 11810.0, 6499.0, 3775.0, 2130.0, 1255.0, 840.0, 552.0, 355.0, 233.0, 176.0, 123.0, 84.0, 51.0, 38.0, 32.0, 20.0, 14.0, 8.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.654296875, -1.5982513427734375, -1.542205810546875, -1.4861602783203125, -1.43011474609375, -1.3740692138671875, -1.318023681640625, -1.2619781494140625, -1.2059326171875, -1.1498870849609375, -1.093841552734375, -1.0377960205078125, -0.98175048828125, -0.9257049560546875, -0.869659423828125, -0.8136138916015625, -0.757568359375, -0.7015228271484375, -0.645477294921875, -0.5894317626953125, -0.53338623046875, -0.4773406982421875, -0.421295166015625, -0.3652496337890625, -0.3092041015625, -0.2531585693359375, -0.197113037109375, -0.1410675048828125, -0.08502197265625, -0.0289764404296875, 0.027069091796875, 0.0831146240234375, 0.13916015625, 0.1952056884765625, 0.251251220703125, 0.3072967529296875, 0.36334228515625, 0.4193878173828125, 0.475433349609375, 0.5314788818359375, 0.5875244140625, 0.6435699462890625, 0.699615478515625, 0.7556610107421875, 0.81170654296875, 0.8677520751953125, 0.923797607421875, 0.9798431396484375, 1.035888671875, 1.0919342041015625, 1.147979736328125, 1.2040252685546875, 1.26007080078125, 1.3161163330078125, 1.372161865234375, 1.4282073974609375, 1.4842529296875, 1.5402984619140625, 1.596343994140625, 1.6523895263671875, 1.70843505859375, 1.7644805908203125, 1.820526123046875, 1.8765716552734375, 1.9326171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 9.0, 4.0, 15.0, 13.0, 4.0, 14.0, 14.0, 14.0, 22.0, 17.0, 30.0, 40.0, 40.0, 42.0, 44.0, 35.0, 53.0, 44.0, 38.0, 36.0, 48.0, 33.0, 33.0, 36.0, 42.0, 37.0, 41.0, 31.0, 25.0, 27.0, 19.0, 15.0, 12.0, 10.0, 9.0, 13.0, 6.0, 5.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.165924072265625, -1.12481689453125, -1.083709716796875, -1.0426025390625, -1.001495361328125, -0.96038818359375, -0.919281005859375, -0.878173828125, -0.837066650390625, -0.79595947265625, -0.754852294921875, -0.7137451171875, -0.672637939453125, -0.63153076171875, -0.590423583984375, -0.54931640625, -0.508209228515625, -0.46710205078125, -0.425994873046875, -0.3848876953125, -0.343780517578125, -0.30267333984375, -0.261566162109375, -0.220458984375, -0.179351806640625, -0.13824462890625, -0.097137451171875, -0.0560302734375, -0.014923095703125, 0.02618408203125, 0.067291259765625, 0.1083984375, 0.149505615234375, 0.19061279296875, 0.231719970703125, 0.2728271484375, 0.313934326171875, 0.35504150390625, 0.396148681640625, 0.437255859375, 0.478363037109375, 0.51947021484375, 0.560577392578125, 0.6016845703125, 0.642791748046875, 0.68389892578125, 0.725006103515625, 0.76611328125, 0.807220458984375, 0.84832763671875, 0.889434814453125, 0.9305419921875, 0.971649169921875, 1.01275634765625, 1.053863525390625, 1.094970703125, 1.136077880859375, 1.17718505859375, 1.218292236328125, 1.2593994140625, 1.300506591796875, 1.34161376953125, 1.382720947265625, 1.423828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 6.0, 8.0, 19.0, 22.0, 27.0, 44.0, 62.0, 71.0, 127.0, 204.0, 298.0, 669.0, 1437.0, 3881.0, 12730.0, 50799.0, 258966.0, 2273973.0, 1363857.0, 175472.0, 36454.0, 9480.0, 3150.0, 1174.0, 516.0, 307.0, 149.0, 107.0, 57.0, 53.0, 36.0, 31.0, 19.0, 7.0, 19.0, 15.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.53125, -4.3687744140625, -4.206298828125, -4.0438232421875, -3.88134765625, -3.7188720703125, -3.556396484375, -3.3939208984375, -3.2314453125, -3.0689697265625, -2.906494140625, -2.7440185546875, -2.58154296875, -2.4190673828125, -2.256591796875, -2.0941162109375, -1.931640625, -1.7691650390625, -1.606689453125, -1.4442138671875, -1.28173828125, -1.1192626953125, -0.956787109375, -0.7943115234375, -0.6318359375, -0.4693603515625, -0.306884765625, -0.1444091796875, 0.01806640625, 0.1805419921875, 0.343017578125, 0.5054931640625, 0.66796875, 0.8304443359375, 0.992919921875, 1.1553955078125, 1.31787109375, 1.4803466796875, 1.642822265625, 1.8052978515625, 1.9677734375, 2.1302490234375, 2.292724609375, 2.4552001953125, 2.61767578125, 2.7801513671875, 2.942626953125, 3.1051025390625, 3.267578125, 3.4300537109375, 3.592529296875, 3.7550048828125, 3.91748046875, 4.0799560546875, 4.242431640625, 4.4049072265625, 4.5673828125, 4.7298583984375, 4.892333984375, 5.0548095703125, 5.21728515625, 5.3797607421875, 5.542236328125, 5.7047119140625, 5.8671875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 25.0, 38.0, 63.0, 95.0, 152.0, 282.0, 464.0, 982.0, 956.0, 461.0, 213.0, 127.0, 77.0, 50.0, 27.0, 13.0, 10.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.41796875, -7.24505615234375, -7.0721435546875, -6.89923095703125, -6.726318359375, -6.55340576171875, -6.3804931640625, -6.20758056640625, -6.03466796875, -5.86175537109375, -5.6888427734375, -5.51593017578125, -5.343017578125, -5.17010498046875, -4.9971923828125, -4.82427978515625, -4.6513671875, -4.47845458984375, -4.3055419921875, -4.13262939453125, -3.959716796875, -3.78680419921875, -3.6138916015625, -3.44097900390625, -3.26806640625, -3.09515380859375, -2.9222412109375, -2.74932861328125, -2.576416015625, -2.40350341796875, -2.2305908203125, -2.05767822265625, -1.884765625, -1.71185302734375, -1.5389404296875, -1.36602783203125, -1.193115234375, -1.02020263671875, -0.8472900390625, -0.67437744140625, -0.50146484375, -0.32855224609375, -0.1556396484375, 0.01727294921875, 0.190185546875, 0.36309814453125, 0.5360107421875, 0.70892333984375, 0.8818359375, 1.05474853515625, 1.2276611328125, 1.40057373046875, 1.573486328125, 1.74639892578125, 1.9193115234375, 2.09222412109375, 2.26513671875, 2.43804931640625, 2.6109619140625, 2.78387451171875, 2.956787109375, 3.12969970703125, 3.3026123046875, 3.47552490234375, 3.6484375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 17.0, 32.0, 59.0, 109.0, 125.0, 126.0, 148.0, 132.0, 96.0, 69.0, 35.0, 24.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.11302185058594, -36.29410934448242, -35.475196838378906, -34.65628433227539, -33.837371826171875, -33.01845932006836, -32.199546813964844, -31.380632400512695, -30.56171989440918, -29.742807388305664, -28.92389488220215, -28.104982376098633, -27.286067962646484, -26.46715545654297, -25.648242950439453, -24.829330444335938, -24.010417938232422, -23.191505432128906, -22.37259292602539, -21.553680419921875, -20.73476791381836, -19.915855407714844, -19.096940994262695, -18.27802848815918, -17.459115982055664, -16.64020347595215, -15.821290969848633, -15.0023775100708, -14.183465003967285, -13.36455249786377, -12.545639038085938, -11.726726531982422, -10.907815933227539, -10.088903427124023, -9.269990921020508, -8.451077461242676, -7.63216495513916, -6.8132524490356445, -5.994339466094971, -5.175426483154297, -4.356513977050781, -3.5376012325286865, -2.718688488006592, -1.899775743484497, -1.0808629989624023, -0.2619504928588867, 0.5569624900817871, 1.375875473022461, 2.1947879791259766, 3.0137007236480713, 3.832613468170166, 4.65152645111084, 5.4704389572143555, 6.289351463317871, 7.108264446258545, 7.927177429199219, 8.746089935302734, 9.56500244140625, 10.383914947509766, 11.202828407287598, 12.021740913391113, 12.840653419494629, 13.659566879272461, 14.478479385375977, 15.297391891479492]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 8.0, 9.0, 15.0, 5.0, 16.0, 18.0, 25.0, 22.0, 21.0, 21.0, 35.0, 37.0, 37.0, 36.0, 37.0, 36.0, 35.0, 37.0, 41.0, 38.0, 39.0, 39.0, 37.0, 30.0, 32.0, 37.0, 37.0, 27.0, 24.0, 19.0, 19.0, 19.0, 15.0, 21.0, 13.0, 9.0, 3.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.630386352539062, -10.316021919250488, -10.001657485961914, -9.68729305267334, -9.372928619384766, -9.058563232421875, -8.7441987991333, -8.429834365844727, -8.115469932556152, -7.801105499267578, -7.486741065979004, -7.1723761558532715, -6.858011722564697, -6.543647289276123, -6.229282379150391, -5.914917945861816, -5.600553512573242, -5.286189079284668, -4.971824645996094, -4.657459735870361, -4.343095302581787, -4.028730869293213, -3.7143661975860596, -3.4000015258789062, -3.085637092590332, -2.771272659301758, -2.4569079875946045, -2.142543315887451, -1.828178882598877, -1.5138143301010132, -1.1994497776031494, -0.8850851058959961, -0.5707206726074219, -0.2563561201095581, 0.058008432388305664, 0.37237298488616943, 0.6867375373840332, 1.001102089881897, 1.3154666423797607, 1.629831314086914, 1.9441957473754883, 2.2585601806640625, 2.572924852371216, 2.887289524078369, 3.2016539573669434, 3.5160183906555176, 3.830383062362671, 4.144747734069824, 4.459112167358398, 4.773476600646973, 5.087841033935547, 5.402205944061279, 5.7165703773498535, 6.030934810638428, 6.34529972076416, 6.659664154052734, 6.974028587341309, 7.288393020629883, 7.602757453918457, 7.9171223640441895, 8.231487274169922, 8.545851707458496, 8.86021614074707, 9.174580574035645, 9.488945007324219]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 5.0, 14.0, 25.0, 42.0, 55.0, 70.0, 109.0, 140.0, 225.0, 320.0, 489.0, 706.0, 1003.0, 1563.0, 2218.0, 3604.0, 5607.0, 9284.0, 15591.0, 27698.0, 58694.0, 163377.0, 388257.0, 217629.0, 72672.0, 33058.0, 17838.0, 10229.0, 6216.0, 3931.0, 2626.0, 1731.0, 1095.0, 785.0, 510.0, 336.0, 235.0, 192.0, 111.0, 69.0, 48.0, 38.0, 37.0, 15.0, 12.0, 16.0, 7.0, 4.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-2.53125, -2.455963134765625, -2.38067626953125, -2.305389404296875, -2.2301025390625, -2.154815673828125, -2.07952880859375, -2.004241943359375, -1.928955078125, -1.853668212890625, -1.77838134765625, -1.703094482421875, -1.6278076171875, -1.552520751953125, -1.47723388671875, -1.401947021484375, -1.32666015625, -1.251373291015625, -1.17608642578125, -1.100799560546875, -1.0255126953125, -0.950225830078125, -0.87493896484375, -0.799652099609375, -0.724365234375, -0.649078369140625, -0.57379150390625, -0.498504638671875, -0.4232177734375, -0.347930908203125, -0.27264404296875, -0.197357177734375, -0.1220703125, -0.046783447265625, 0.02850341796875, 0.103790283203125, 0.1790771484375, 0.254364013671875, 0.32965087890625, 0.404937744140625, 0.480224609375, 0.555511474609375, 0.63079833984375, 0.706085205078125, 0.7813720703125, 0.856658935546875, 0.93194580078125, 1.007232666015625, 1.08251953125, 1.157806396484375, 1.23309326171875, 1.308380126953125, 1.3836669921875, 1.458953857421875, 1.53424072265625, 1.609527587890625, 1.684814453125, 1.760101318359375, 1.83538818359375, 1.910675048828125, 1.9859619140625, 2.061248779296875, 2.13653564453125, 2.211822509765625, 2.287109375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 3.0, 10.0, 11.0, 20.0, 25.0, 26.0, 32.0, 30.0, 23.0, 31.0, 34.0, 48.0, 46.0, 50.0, 59.0, 54.0, 47.0, 54.0, 32.0, 41.0, 35.0, 40.0, 27.0, 36.0, 27.0, 28.0, 21.0, 22.0, 19.0, 14.0, 9.0, 8.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8154296875, -1.76361083984375, -1.7117919921875, -1.65997314453125, -1.608154296875, -1.55633544921875, -1.5045166015625, -1.45269775390625, -1.40087890625, -1.34906005859375, -1.2972412109375, -1.24542236328125, -1.193603515625, -1.14178466796875, -1.0899658203125, -1.03814697265625, -0.986328125, -0.93450927734375, -0.8826904296875, -0.83087158203125, -0.779052734375, -0.72723388671875, -0.6754150390625, -0.62359619140625, -0.57177734375, -0.51995849609375, -0.4681396484375, -0.41632080078125, -0.364501953125, -0.31268310546875, -0.2608642578125, -0.20904541015625, -0.1572265625, -0.10540771484375, -0.0535888671875, -0.00177001953125, 0.050048828125, 0.10186767578125, 0.1536865234375, 0.20550537109375, 0.25732421875, 0.30914306640625, 0.3609619140625, 0.41278076171875, 0.464599609375, 0.51641845703125, 0.5682373046875, 0.62005615234375, 0.671875, 0.72369384765625, 0.7755126953125, 0.82733154296875, 0.879150390625, 0.93096923828125, 0.9827880859375, 1.03460693359375, 1.08642578125, 1.13824462890625, 1.1900634765625, 1.24188232421875, 1.293701171875, 1.34552001953125, 1.3973388671875, 1.44915771484375, 1.5009765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 11.0, 14.0, 16.0, 29.0, 51.0, 86.0, 145.0, 223.0, 439.0, 772.0, 1601.0, 3294.0, 7017.0, 14795.0, 35566.0, 116166.0, 474850.0, 284086.0, 64735.0, 23978.0, 10599.0, 4971.0, 2451.0, 1259.0, 592.0, 313.0, 164.0, 109.0, 66.0, 34.0, 38.0, 17.0, 19.0, 10.0, 7.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.689453125, -3.576904296875, -3.46435546875, -3.351806640625, -3.2392578125, -3.126708984375, -3.01416015625, -2.901611328125, -2.7890625, -2.676513671875, -2.56396484375, -2.451416015625, -2.3388671875, -2.226318359375, -2.11376953125, -2.001220703125, -1.888671875, -1.776123046875, -1.66357421875, -1.551025390625, -1.4384765625, -1.325927734375, -1.21337890625, -1.100830078125, -0.98828125, -0.875732421875, -0.76318359375, -0.650634765625, -0.5380859375, -0.425537109375, -0.31298828125, -0.200439453125, -0.087890625, 0.024658203125, 0.13720703125, 0.249755859375, 0.3623046875, 0.474853515625, 0.58740234375, 0.699951171875, 0.8125, 0.925048828125, 1.03759765625, 1.150146484375, 1.2626953125, 1.375244140625, 1.48779296875, 1.600341796875, 1.712890625, 1.825439453125, 1.93798828125, 2.050537109375, 2.1630859375, 2.275634765625, 2.38818359375, 2.500732421875, 2.61328125, 2.725830078125, 2.83837890625, 2.950927734375, 3.0634765625, 3.176025390625, 3.28857421875, 3.401123046875, 3.513671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 8.0, 9.0, 10.0, 6.0, 21.0, 19.0, 15.0, 18.0, 24.0, 17.0, 21.0, 26.0, 28.0, 29.0, 30.0, 30.0, 37.0, 30.0, 28.0, 48.0, 38.0, 28.0, 34.0, 37.0, 37.0, 26.0, 35.0, 31.0, 21.0, 27.0, 22.0, 21.0, 22.0, 21.0, 18.0, 16.0, 15.0, 12.0, 10.0, 5.0, 12.0, 13.0, 6.0, 2.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.453125, -3.3436279296875, -3.234130859375, -3.1246337890625, -3.01513671875, -2.9056396484375, -2.796142578125, -2.6866455078125, -2.5771484375, -2.4676513671875, -2.358154296875, -2.2486572265625, -2.13916015625, -2.0296630859375, -1.920166015625, -1.8106689453125, -1.701171875, -1.5916748046875, -1.482177734375, -1.3726806640625, -1.26318359375, -1.1536865234375, -1.044189453125, -0.9346923828125, -0.8251953125, -0.7156982421875, -0.606201171875, -0.4967041015625, -0.38720703125, -0.2777099609375, -0.168212890625, -0.0587158203125, 0.05078125, 0.1602783203125, 0.269775390625, 0.3792724609375, 0.48876953125, 0.5982666015625, 0.707763671875, 0.8172607421875, 0.9267578125, 1.0362548828125, 1.145751953125, 1.2552490234375, 1.36474609375, 1.4742431640625, 1.583740234375, 1.6932373046875, 1.802734375, 1.9122314453125, 2.021728515625, 2.1312255859375, 2.24072265625, 2.3502197265625, 2.459716796875, 2.5692138671875, 2.6787109375, 2.7882080078125, 2.897705078125, 3.0072021484375, 3.11669921875, 3.2261962890625, 3.335693359375, 3.4451904296875, 3.5546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 11.0, 16.0, 28.0, 40.0, 41.0, 86.0, 110.0, 189.0, 281.0, 482.0, 827.0, 1443.0, 2489.0, 4670.0, 8501.0, 15734.0, 30276.0, 59858.0, 129268.0, 311052.0, 267872.0, 107535.0, 51339.0, 25900.0, 13679.0, 7398.0, 4001.0, 2266.0, 1269.0, 741.0, 399.0, 274.0, 151.0, 110.0, 81.0, 40.0, 27.0, 23.0, 8.0, 12.0, 7.0, 5.0, 3.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9676971435546875, -0.936370849609375, -0.9050445556640625, -0.87371826171875, -0.8423919677734375, -0.811065673828125, -0.7797393798828125, -0.7484130859375, -0.7170867919921875, -0.685760498046875, -0.6544342041015625, -0.62310791015625, -0.5917816162109375, -0.560455322265625, -0.5291290283203125, -0.497802734375, -0.4664764404296875, -0.435150146484375, -0.4038238525390625, -0.37249755859375, -0.3411712646484375, -0.309844970703125, -0.2785186767578125, -0.2471923828125, -0.2158660888671875, -0.184539794921875, -0.1532135009765625, -0.12188720703125, -0.0905609130859375, -0.059234619140625, -0.0279083251953125, 0.00341796875, 0.0347442626953125, 0.066070556640625, 0.0973968505859375, 0.12872314453125, 0.1600494384765625, 0.191375732421875, 0.2227020263671875, 0.2540283203125, 0.2853546142578125, 0.316680908203125, 0.3480072021484375, 0.37933349609375, 0.4106597900390625, 0.441986083984375, 0.4733123779296875, 0.504638671875, 0.5359649658203125, 0.567291259765625, 0.5986175537109375, 0.62994384765625, 0.6612701416015625, 0.692596435546875, 0.7239227294921875, 0.7552490234375, 0.7865753173828125, 0.817901611328125, 0.8492279052734375, 0.88055419921875, 0.9118804931640625, 0.943206787109375, 0.9745330810546875, 1.005859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 10.0, 8.0, 13.0, 23.0, 18.0, 33.0, 43.0, 87.0, 135.0, 181.0, 149.0, 82.0, 54.0, 41.0, 23.0, 19.0, 14.0, 14.0, 16.0, 5.0, 5.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003495216369628906, -0.000337306410074234, -0.0003250911831855774, -0.0003128759562969208, -0.00030066072940826416, -0.00028844550251960754, -0.00027623027563095093, -0.0002640150487422943, -0.0002517998218536377, -0.00023958459496498108, -0.00022736936807632446, -0.00021515414118766785, -0.00020293891429901123, -0.00019072368741035461, -0.000178508460521698, -0.00016629323363304138, -0.00015407800674438477, -0.00014186277985572815, -0.00012964755296707153, -0.00011743232607841492, -0.0001052170991897583, -9.300187230110168e-05, -8.078664541244507e-05, -6.857141852378845e-05, -5.6356191635131836e-05, -4.414096474647522e-05, -3.1925737857818604e-05, -1.9710510969161987e-05, -7.495284080505371e-06, 4.719942808151245e-06, 1.693516969680786e-05, 2.9150396585464478e-05, 4.1365623474121094e-05, 5.358085036277771e-05, 6.579607725143433e-05, 7.801130414009094e-05, 9.022653102874756e-05, 0.00010244175791740417, 0.00011465698480606079, 0.0001268722116947174, 0.00013908743858337402, 0.00015130266547203064, 0.00016351789236068726, 0.00017573311924934387, 0.0001879483461380005, 0.0002001635730266571, 0.00021237879991531372, 0.00022459402680397034, 0.00023680925369262695, 0.00024902448058128357, 0.0002612397074699402, 0.0002734549343585968, 0.0002856701612472534, 0.00029788538813591003, 0.00031010061502456665, 0.00032231584191322327, 0.0003345310688018799, 0.0003467462956905365, 0.0003589615225791931, 0.00037117674946784973, 0.00038339197635650635, 0.00039560720324516296, 0.0004078224301338196, 0.0004200376570224762, 0.0004322528839111328]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 14.0, 12.0, 22.0, 37.0, 64.0, 90.0, 134.0, 247.0, 491.0, 1061.0, 2634.0, 6564.0, 18900.0, 58192.0, 208554.0, 489618.0, 182510.0, 51788.0, 17003.0, 6077.0, 2389.0, 1046.0, 433.0, 276.0, 146.0, 80.0, 57.0, 32.0, 20.0, 16.0, 9.0, 8.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4443359375, -1.3917236328125, -1.339111328125, -1.2864990234375, -1.23388671875, -1.1812744140625, -1.128662109375, -1.0760498046875, -1.0234375, -0.9708251953125, -0.918212890625, -0.8656005859375, -0.81298828125, -0.7603759765625, -0.707763671875, -0.6551513671875, -0.6025390625, -0.5499267578125, -0.497314453125, -0.4447021484375, -0.39208984375, -0.3394775390625, -0.286865234375, -0.2342529296875, -0.181640625, -0.1290283203125, -0.076416015625, -0.0238037109375, 0.02880859375, 0.0814208984375, 0.134033203125, 0.1866455078125, 0.2392578125, 0.2918701171875, 0.344482421875, 0.3970947265625, 0.44970703125, 0.5023193359375, 0.554931640625, 0.6075439453125, 0.66015625, 0.7127685546875, 0.765380859375, 0.8179931640625, 0.87060546875, 0.9232177734375, 0.975830078125, 1.0284423828125, 1.0810546875, 1.1336669921875, 1.186279296875, 1.2388916015625, 1.29150390625, 1.3441162109375, 1.396728515625, 1.4493408203125, 1.501953125, 1.5545654296875, 1.607177734375, 1.6597900390625, 1.71240234375, 1.7650146484375, 1.817626953125, 1.8702392578125, 1.9228515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 22.0, 25.0, 23.0, 30.0, 29.0, 37.0, 37.0, 47.0, 63.0, 89.0, 73.0, 77.0, 58.0, 61.0, 48.0, 44.0, 29.0, 25.0, 26.0, 26.0, 20.0, 15.0, 7.0, 5.0, 1.0, 7.0, 6.0, 7.0, 5.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9287109375, -0.8962249755859375, -0.863739013671875, -0.8312530517578125, -0.79876708984375, -0.7662811279296875, -0.733795166015625, -0.7013092041015625, -0.6688232421875, -0.6363372802734375, -0.603851318359375, -0.5713653564453125, -0.53887939453125, -0.5063934326171875, -0.473907470703125, -0.4414215087890625, -0.408935546875, -0.3764495849609375, -0.343963623046875, -0.3114776611328125, -0.27899169921875, -0.2465057373046875, -0.214019775390625, -0.1815338134765625, -0.1490478515625, -0.1165618896484375, -0.084075927734375, -0.0515899658203125, -0.01910400390625, 0.0133819580078125, 0.045867919921875, 0.0783538818359375, 0.11083984375, 0.1433258056640625, 0.175811767578125, 0.2082977294921875, 0.24078369140625, 0.2732696533203125, 0.305755615234375, 0.3382415771484375, 0.3707275390625, 0.4032135009765625, 0.435699462890625, 0.4681854248046875, 0.50067138671875, 0.5331573486328125, 0.565643310546875, 0.5981292724609375, 0.630615234375, 0.6631011962890625, 0.695587158203125, 0.7280731201171875, 0.76055908203125, 0.7930450439453125, 0.825531005859375, 0.8580169677734375, 0.8905029296875, 0.9229888916015625, 0.955474853515625, 0.9879608154296875, 1.02044677734375, 1.0529327392578125, 1.085418701171875, 1.1179046630859375, 1.150390625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 7.0, 21.0, 39.0, 60.0, 88.0, 129.0, 142.0, 152.0, 132.0, 89.0, 54.0, 32.0, 21.0, 22.0, 8.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.992462158203125, -9.36529541015625, -8.738128662109375, -8.1109619140625, -7.483795166015625, -6.85662841796875, -6.229461193084717, -5.602294445037842, -4.975127696990967, -4.347960948944092, -3.720794200897217, -3.0936272144317627, -2.4664604663848877, -1.8392937183380127, -1.2121267318725586, -0.5849599838256836, 0.042206764221191406, 0.6693735718727112, 1.296540379524231, 1.9237072467803955, 2.5508739948272705, 3.1780407428741455, 3.8052077293395996, 4.432374477386475, 5.05954122543335, 5.686707973480225, 6.3138747215271, 6.941041946411133, 7.568208694458008, 8.195375442504883, 8.822542190551758, 9.449708938598633, 10.076875686645508, 10.704042434692383, 11.331209182739258, 11.958375930786133, 12.585542678833008, 13.212709426879883, 13.839876174926758, 14.467042922973633, 15.094209671020508, 15.721376419067383, 16.348543167114258, 16.975709915161133, 17.602876663208008, 18.230043411254883, 18.857210159301758, 19.484376907348633, 20.11154556274414, 20.738712310791016, 21.36587905883789, 21.993045806884766, 22.62021255493164, 23.247379302978516, 23.87454605102539, 24.501712799072266, 25.12887954711914, 25.756046295166016, 26.38321304321289, 27.010379791259766, 27.63754653930664, 28.264713287353516, 28.89188003540039, 29.519046783447266, 30.14621353149414]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 11.0, 6.0, 6.0, 13.0, 10.0, 11.0, 17.0, 14.0, 37.0, 23.0, 29.0, 35.0, 38.0, 32.0, 37.0, 26.0, 32.0, 37.0, 36.0, 30.0, 36.0, 32.0, 42.0, 43.0, 38.0, 39.0, 23.0, 31.0, 20.0, 16.0, 23.0, 14.0, 22.0, 17.0, 14.0, 14.0, 13.0, 17.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.290658950805664, -9.01656436920166, -8.742469787597656, -8.468375205993652, -8.194280624389648, -7.920185565948486, -7.646090507507324, -7.37199592590332, -7.097901344299316, -6.8238067626953125, -6.549712181091309, -6.2756171226501465, -6.001522541046143, -5.727427959442139, -5.453332901000977, -5.179238319396973, -4.905143737792969, -4.631049156188965, -4.356954574584961, -4.082859516143799, -3.808764934539795, -3.534670352935791, -3.260575532913208, -2.986480712890625, -2.712386131286621, -2.438291549682617, -2.164196729660034, -1.8901020288467407, -1.6160073280334473, -1.3419126272201538, -1.0678179264068604, -0.7937232255935669, -0.519627571105957, -0.24553287029266357, 0.028561830520629883, 0.30265653133392334, 0.5767512321472168, 0.8508459329605103, 1.1249406337738037, 1.3990353345870972, 1.6731300354003906, 1.947224736213684, 2.2213194370269775, 2.4954142570495605, 2.7695088386535645, 3.0436034202575684, 3.3176982402801514, 3.5917930603027344, 3.8658876419067383, 4.139982223510742, 4.414076805114746, 4.688171863555908, 4.962266445159912, 5.236361026763916, 5.510456085205078, 5.784550666809082, 6.058645248413086, 6.33273983001709, 6.606834411621094, 6.880929470062256, 7.15502405166626, 7.429118633270264, 7.703213691711426, 7.97730827331543, 8.251402854919434]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 20.0, 12.0, 23.0, 27.0, 36.0, 65.0, 74.0, 107.0, 195.0, 288.0, 396.0, 625.0, 1075.0, 1674.0, 2892.0, 5006.0, 8970.0, 17515.0, 35910.0, 80716.0, 211024.0, 781850.0, 2164238.0, 571941.0, 172689.0, 69915.0, 32015.0, 15818.0, 8089.0, 4486.0, 2553.0, 1472.0, 968.0, 532.0, 358.0, 214.0, 152.0, 102.0, 68.0, 47.0, 41.0, 19.0, 21.0, 9.0, 7.0, 8.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.39453125, -2.322845458984375, -2.25115966796875, -2.179473876953125, -2.1077880859375, -2.036102294921875, -1.96441650390625, -1.892730712890625, -1.821044921875, -1.749359130859375, -1.67767333984375, -1.605987548828125, -1.5343017578125, -1.462615966796875, -1.39093017578125, -1.319244384765625, -1.24755859375, -1.175872802734375, -1.10418701171875, -1.032501220703125, -0.9608154296875, -0.889129638671875, -0.81744384765625, -0.745758056640625, -0.674072265625, -0.602386474609375, -0.53070068359375, -0.459014892578125, -0.3873291015625, -0.315643310546875, -0.24395751953125, -0.172271728515625, -0.1005859375, -0.028900146484375, 0.04278564453125, 0.114471435546875, 0.1861572265625, 0.257843017578125, 0.32952880859375, 0.401214599609375, 0.472900390625, 0.544586181640625, 0.61627197265625, 0.687957763671875, 0.7596435546875, 0.831329345703125, 0.90301513671875, 0.974700927734375, 1.04638671875, 1.118072509765625, 1.18975830078125, 1.261444091796875, 1.3331298828125, 1.404815673828125, 1.47650146484375, 1.548187255859375, 1.619873046875, 1.691558837890625, 1.76324462890625, 1.834930419921875, 1.9066162109375, 1.978302001953125, 2.04998779296875, 2.121673583984375, 2.193359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 6.0, 17.0, 9.0, 26.0, 17.0, 16.0, 27.0, 34.0, 28.0, 30.0, 40.0, 39.0, 38.0, 39.0, 30.0, 42.0, 49.0, 37.0, 53.0, 50.0, 40.0, 47.0, 35.0, 31.0, 30.0, 29.0, 24.0, 22.0, 13.0, 11.0, 13.0, 12.0, 21.0, 6.0, 6.0, 8.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3735809326171875, -1.327239990234375, -1.2808990478515625, -1.23455810546875, -1.1882171630859375, -1.141876220703125, -1.0955352783203125, -1.0491943359375, -1.0028533935546875, -0.956512451171875, -0.9101715087890625, -0.86383056640625, -0.8174896240234375, -0.771148681640625, -0.7248077392578125, -0.678466796875, -0.6321258544921875, -0.585784912109375, -0.5394439697265625, -0.49310302734375, -0.4467620849609375, -0.400421142578125, -0.3540802001953125, -0.3077392578125, -0.2613983154296875, -0.215057373046875, -0.1687164306640625, -0.12237548828125, -0.0760345458984375, -0.029693603515625, 0.0166473388671875, 0.06298828125, 0.1093292236328125, 0.155670166015625, 0.2020111083984375, 0.24835205078125, 0.2946929931640625, 0.341033935546875, 0.3873748779296875, 0.4337158203125, 0.4800567626953125, 0.526397705078125, 0.5727386474609375, 0.61907958984375, 0.6654205322265625, 0.711761474609375, 0.7581024169921875, 0.804443359375, 0.8507843017578125, 0.897125244140625, 0.9434661865234375, 0.98980712890625, 1.0361480712890625, 1.082489013671875, 1.1288299560546875, 1.1751708984375, 1.2215118408203125, 1.267852783203125, 1.3141937255859375, 1.36053466796875, 1.4068756103515625, 1.453216552734375, 1.4995574951171875, 1.5458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 5.0, 13.0, 8.0, 22.0, 37.0, 41.0, 79.0, 110.0, 174.0, 298.0, 513.0, 845.0, 1588.0, 2792.0, 5538.0, 11355.0, 24782.0, 57065.0, 142546.0, 421188.0, 1901029.0, 1156570.0, 283404.0, 103607.0, 42400.0, 19189.0, 8994.0, 4551.0, 2320.0, 1234.0, 762.0, 440.0, 274.0, 182.0, 107.0, 75.0, 51.0, 34.0, 18.0, 15.0, 12.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.193359375, -3.096099853515625, -2.99884033203125, -2.901580810546875, -2.8043212890625, -2.707061767578125, -2.60980224609375, -2.512542724609375, -2.415283203125, -2.318023681640625, -2.22076416015625, -2.123504638671875, -2.0262451171875, -1.928985595703125, -1.83172607421875, -1.734466552734375, -1.63720703125, -1.539947509765625, -1.44268798828125, -1.345428466796875, -1.2481689453125, -1.150909423828125, -1.05364990234375, -0.956390380859375, -0.859130859375, -0.761871337890625, -0.66461181640625, -0.567352294921875, -0.4700927734375, -0.372833251953125, -0.27557373046875, -0.178314208984375, -0.0810546875, 0.016204833984375, 0.11346435546875, 0.210723876953125, 0.3079833984375, 0.405242919921875, 0.50250244140625, 0.599761962890625, 0.697021484375, 0.794281005859375, 0.89154052734375, 0.988800048828125, 1.0860595703125, 1.183319091796875, 1.28057861328125, 1.377838134765625, 1.47509765625, 1.572357177734375, 1.66961669921875, 1.766876220703125, 1.8641357421875, 1.961395263671875, 2.05865478515625, 2.155914306640625, 2.253173828125, 2.350433349609375, 2.44769287109375, 2.544952392578125, 2.6422119140625, 2.739471435546875, 2.83673095703125, 2.933990478515625, 3.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 11.0, 16.0, 18.0, 20.0, 18.0, 26.0, 41.0, 45.0, 74.0, 114.0, 153.0, 222.0, 305.0, 516.0, 785.0, 576.0, 323.0, 227.0, 164.0, 107.0, 67.0, 68.0, 50.0, 35.0, 25.0, 16.0, 10.0, 9.0, 10.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.25, -3.136474609375, -3.02294921875, -2.909423828125, -2.7958984375, -2.682373046875, -2.56884765625, -2.455322265625, -2.341796875, -2.228271484375, -2.11474609375, -2.001220703125, -1.8876953125, -1.774169921875, -1.66064453125, -1.547119140625, -1.43359375, -1.320068359375, -1.20654296875, -1.093017578125, -0.9794921875, -0.865966796875, -0.75244140625, -0.638916015625, -0.525390625, -0.411865234375, -0.29833984375, -0.184814453125, -0.0712890625, 0.042236328125, 0.15576171875, 0.269287109375, 0.3828125, 0.496337890625, 0.60986328125, 0.723388671875, 0.8369140625, 0.950439453125, 1.06396484375, 1.177490234375, 1.291015625, 1.404541015625, 1.51806640625, 1.631591796875, 1.7451171875, 1.858642578125, 1.97216796875, 2.085693359375, 2.19921875, 2.312744140625, 2.42626953125, 2.539794921875, 2.6533203125, 2.766845703125, 2.88037109375, 2.993896484375, 3.107421875, 3.220947265625, 3.33447265625, 3.447998046875, 3.5615234375, 3.675048828125, 3.78857421875, 3.902099609375, 4.015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 14.0, 15.0, 38.0, 51.0, 86.0, 103.0, 129.0, 132.0, 110.0, 102.0, 78.0, 42.0, 39.0, 20.0, 8.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-28.697418212890625, -28.034278869628906, -27.371139526367188, -26.70800018310547, -26.04486083984375, -25.3817195892334, -24.71858024597168, -24.05544090270996, -23.392301559448242, -22.729162216186523, -22.066022872924805, -21.402883529663086, -20.739742279052734, -20.076602935791016, -19.413463592529297, -18.750324249267578, -18.08718490600586, -17.42404556274414, -16.760906219482422, -16.097766876220703, -15.434626579284668, -14.77148723602295, -14.108346939086914, -13.445207595825195, -12.782068252563477, -12.118928909301758, -11.455789566040039, -10.792649269104004, -10.129509925842285, -9.466370582580566, -8.803230285644531, -8.140090942382812, -7.476951599121094, -6.813812255859375, -6.150672435760498, -5.487532615661621, -4.824393272399902, -4.161253929138184, -3.4981141090393066, -2.8349742889404297, -2.171834945678711, -1.508695363998413, -0.8455557823181152, -0.18241620063781738, 0.48072338104248047, 1.1438629627227783, 1.8070025444030762, 2.470142364501953, 3.133281707763672, 3.7964212894439697, 4.459560871124268, 5.1227006912231445, 5.785840034484863, 6.448979377746582, 7.112119197845459, 7.775259017944336, 8.438398361206055, 9.101537704467773, 9.764677047729492, 10.427817344665527, 11.090956687927246, 11.754096031188965, 12.417236328125, 13.080375671386719, 13.743515014648438]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 3.0, 6.0, 8.0, 12.0, 16.0, 19.0, 10.0, 17.0, 24.0, 25.0, 26.0, 28.0, 34.0, 38.0, 26.0, 20.0, 40.0, 32.0, 39.0, 49.0, 35.0, 43.0, 44.0, 33.0, 40.0, 41.0, 32.0, 28.0, 37.0, 21.0, 8.0, 24.0, 17.0, 22.0, 17.0, 13.0, 8.0, 12.0, 10.0, 8.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.769560813903809, -8.477986335754395, -8.18641185760498, -7.894836902618408, -7.603261947631836, -7.311687469482422, -7.020112991333008, -6.728538513183594, -6.4369635581970215, -6.145389080047607, -5.853814125061035, -5.562239646911621, -5.270665168762207, -4.979090213775635, -4.687515735626221, -4.395940780639648, -4.104366302490234, -3.812791585922241, -3.521216869354248, -3.229642391204834, -2.938067674636841, -2.6464929580688477, -2.3549184799194336, -2.0633437633514404, -1.7717690467834473, -1.480194330215454, -1.1886197328567505, -0.8970450758934021, -0.6054704189300537, -0.31389570236206055, -0.022321105003356934, 0.2692534923553467, 0.5608272552490234, 0.8524019122123718, 1.1439765691757202, 1.4355511665344238, 1.727125883102417, 2.01870059967041, 2.310275077819824, 2.6018497943878174, 2.8934245109558105, 3.1849992275238037, 3.476573944091797, 3.768148422241211, 4.059722900390625, 4.351297855377197, 4.642872333526611, 4.934447288513184, 5.226021766662598, 5.517596244812012, 5.809171199798584, 6.100745677947998, 6.39232063293457, 6.683895111083984, 6.975469589233398, 7.2670440673828125, 7.558619022369385, 7.850193500518799, 8.141768455505371, 8.433342933654785, 8.7249174118042, 9.01649284362793, 9.308067321777344, 9.599641799926758, 9.891216278076172]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 11.0, 16.0, 16.0, 42.0, 36.0, 84.0, 141.0, 202.0, 281.0, 395.0, 687.0, 937.0, 1458.0, 2122.0, 3332.0, 5097.0, 8104.0, 13892.0, 25153.0, 52236.0, 124719.0, 273903.0, 284112.0, 132206.0, 54988.0, 26464.0, 14158.0, 8351.0, 5306.0, 3368.0, 2231.0, 1475.0, 1019.0, 659.0, 437.0, 320.0, 194.0, 164.0, 76.0, 57.0, 37.0, 29.0, 17.0, 10.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.0853118896484375, -2.022186279296875, -1.9590606689453125, -1.89593505859375, -1.8328094482421875, -1.769683837890625, -1.7065582275390625, -1.6434326171875, -1.5803070068359375, -1.517181396484375, -1.4540557861328125, -1.39093017578125, -1.3278045654296875, -1.264678955078125, -1.2015533447265625, -1.138427734375, -1.0753021240234375, -1.012176513671875, -0.9490509033203125, -0.88592529296875, -0.8227996826171875, -0.759674072265625, -0.6965484619140625, -0.6334228515625, -0.5702972412109375, -0.507171630859375, -0.4440460205078125, -0.38092041015625, -0.3177947998046875, -0.254669189453125, -0.1915435791015625, -0.12841796875, -0.0652923583984375, -0.002166748046875, 0.0609588623046875, 0.12408447265625, 0.1872100830078125, 0.250335693359375, 0.3134613037109375, 0.3765869140625, 0.4397125244140625, 0.502838134765625, 0.5659637451171875, 0.62908935546875, 0.6922149658203125, 0.755340576171875, 0.8184661865234375, 0.881591796875, 0.9447174072265625, 1.007843017578125, 1.0709686279296875, 1.13409423828125, 1.1972198486328125, 1.260345458984375, 1.3234710693359375, 1.3865966796875, 1.4497222900390625, 1.512847900390625, 1.5759735107421875, 1.63909912109375, 1.7022247314453125, 1.765350341796875, 1.8284759521484375, 1.8916015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 9.0, 5.0, 12.0, 16.0, 20.0, 10.0, 18.0, 17.0, 30.0, 22.0, 38.0, 53.0, 45.0, 33.0, 50.0, 52.0, 42.0, 51.0, 53.0, 48.0, 46.0, 41.0, 33.0, 36.0, 31.0, 40.0, 23.0, 15.0, 19.0, 29.0, 9.0, 7.0, 9.0, 10.0, 13.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.6053314208984375, -1.552459716796875, -1.4995880126953125, -1.44671630859375, -1.3938446044921875, -1.340972900390625, -1.2881011962890625, -1.2352294921875, -1.1823577880859375, -1.129486083984375, -1.0766143798828125, -1.02374267578125, -0.9708709716796875, -0.917999267578125, -0.8651275634765625, -0.812255859375, -0.7593841552734375, -0.706512451171875, -0.6536407470703125, -0.60076904296875, -0.5478973388671875, -0.495025634765625, -0.4421539306640625, -0.3892822265625, -0.3364105224609375, -0.283538818359375, -0.2306671142578125, -0.17779541015625, -0.1249237060546875, -0.072052001953125, -0.0191802978515625, 0.03369140625, 0.0865631103515625, 0.139434814453125, 0.1923065185546875, 0.24517822265625, 0.2980499267578125, 0.350921630859375, 0.4037933349609375, 0.4566650390625, 0.5095367431640625, 0.562408447265625, 0.6152801513671875, 0.66815185546875, 0.7210235595703125, 0.773895263671875, 0.8267669677734375, 0.879638671875, 0.9325103759765625, 0.985382080078125, 1.0382537841796875, 1.09112548828125, 1.1439971923828125, 1.196868896484375, 1.2497406005859375, 1.3026123046875, 1.3554840087890625, 1.408355712890625, 1.4612274169921875, 1.51409912109375, 1.5669708251953125, 1.619842529296875, 1.6727142333984375, 1.7255859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 5.0, 8.0, 12.0, 14.0, 27.0, 39.0, 61.0, 94.0, 149.0, 170.0, 297.0, 458.0, 789.0, 1407.0, 2445.0, 4173.0, 7442.0, 14038.0, 27424.0, 63894.0, 170449.0, 338594.0, 243915.0, 94651.0, 37597.0, 18080.0, 9651.0, 5320.0, 3001.0, 1686.0, 1043.0, 592.0, 371.0, 229.0, 135.0, 88.0, 55.0, 38.0, 38.0, 30.0, 13.0, 9.0, 6.0, 7.0, 5.0, 7.0, 3.0, 1.0, 2.0], "bins": [-2.623046875, -2.55157470703125, -2.4801025390625, -2.40863037109375, -2.337158203125, -2.26568603515625, -2.1942138671875, -2.12274169921875, -2.05126953125, -1.97979736328125, -1.9083251953125, -1.83685302734375, -1.765380859375, -1.69390869140625, -1.6224365234375, -1.55096435546875, -1.4794921875, -1.40802001953125, -1.3365478515625, -1.26507568359375, -1.193603515625, -1.12213134765625, -1.0506591796875, -0.97918701171875, -0.90771484375, -0.83624267578125, -0.7647705078125, -0.69329833984375, -0.621826171875, -0.55035400390625, -0.4788818359375, -0.40740966796875, -0.3359375, -0.26446533203125, -0.1929931640625, -0.12152099609375, -0.050048828125, 0.02142333984375, 0.0928955078125, 0.16436767578125, 0.23583984375, 0.30731201171875, 0.3787841796875, 0.45025634765625, 0.521728515625, 0.59320068359375, 0.6646728515625, 0.73614501953125, 0.8076171875, 0.87908935546875, 0.9505615234375, 1.02203369140625, 1.093505859375, 1.16497802734375, 1.2364501953125, 1.30792236328125, 1.37939453125, 1.45086669921875, 1.5223388671875, 1.59381103515625, 1.665283203125, 1.73675537109375, 1.8082275390625, 1.87969970703125, 1.951171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 9.0, 13.0, 13.0, 11.0, 23.0, 21.0, 30.0, 27.0, 24.0, 29.0, 26.0, 31.0, 37.0, 33.0, 29.0, 36.0, 37.0, 49.0, 50.0, 37.0, 39.0, 33.0, 30.0, 29.0, 41.0, 29.0, 22.0, 22.0, 20.0, 32.0, 20.0, 19.0, 11.0, 15.0, 10.0, 8.0, 11.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.21875, -4.093963623046875, -3.96917724609375, -3.844390869140625, -3.7196044921875, -3.594818115234375, -3.47003173828125, -3.345245361328125, -3.220458984375, -3.095672607421875, -2.97088623046875, -2.846099853515625, -2.7213134765625, -2.596527099609375, -2.47174072265625, -2.346954345703125, -2.22216796875, -2.097381591796875, -1.97259521484375, -1.847808837890625, -1.7230224609375, -1.598236083984375, -1.47344970703125, -1.348663330078125, -1.223876953125, -1.099090576171875, -0.97430419921875, -0.849517822265625, -0.7247314453125, -0.599945068359375, -0.47515869140625, -0.350372314453125, -0.2255859375, -0.100799560546875, 0.02398681640625, 0.148773193359375, 0.2735595703125, 0.398345947265625, 0.52313232421875, 0.647918701171875, 0.772705078125, 0.897491455078125, 1.02227783203125, 1.147064208984375, 1.2718505859375, 1.396636962890625, 1.52142333984375, 1.646209716796875, 1.77099609375, 1.895782470703125, 2.02056884765625, 2.145355224609375, 2.2701416015625, 2.394927978515625, 2.51971435546875, 2.644500732421875, 2.769287109375, 2.894073486328125, 3.01885986328125, 3.143646240234375, 3.2684326171875, 3.393218994140625, 3.51800537109375, 3.642791748046875, 3.767578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 9.0, 15.0, 18.0, 13.0, 29.0, 34.0, 65.0, 104.0, 147.0, 241.0, 341.0, 567.0, 852.0, 1336.0, 1961.0, 3396.0, 5485.0, 8954.0, 15323.0, 26728.0, 47638.0, 89128.0, 163309.0, 235491.0, 196975.0, 111445.0, 59242.0, 32917.0, 18762.0, 10725.0, 6436.0, 3949.0, 2556.0, 1542.0, 981.0, 629.0, 402.0, 265.0, 172.0, 118.0, 81.0, 45.0, 32.0, 35.0, 16.0, 18.0, 12.0, 6.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7021484375, -0.6799850463867188, -0.6578216552734375, -0.6356582641601562, -0.613494873046875, -0.5913314819335938, -0.5691680908203125, -0.5470046997070312, -0.52484130859375, -0.5026779174804688, -0.4805145263671875, -0.45835113525390625, -0.436187744140625, -0.41402435302734375, -0.3918609619140625, -0.36969757080078125, -0.3475341796875, -0.32537078857421875, -0.3032073974609375, -0.28104400634765625, -0.258880615234375, -0.23671722412109375, -0.2145538330078125, -0.19239044189453125, -0.17022705078125, -0.14806365966796875, -0.1259002685546875, -0.10373687744140625, -0.081573486328125, -0.05941009521484375, -0.0372467041015625, -0.01508331298828125, 0.007080078125, 0.02924346923828125, 0.0514068603515625, 0.07357025146484375, 0.095733642578125, 0.11789703369140625, 0.1400604248046875, 0.16222381591796875, 0.18438720703125, 0.20655059814453125, 0.2287139892578125, 0.25087738037109375, 0.273040771484375, 0.29520416259765625, 0.3173675537109375, 0.33953094482421875, 0.3616943359375, 0.38385772705078125, 0.4060211181640625, 0.42818450927734375, 0.450347900390625, 0.47251129150390625, 0.4946746826171875, 0.5168380737304688, 0.53900146484375, 0.5611648559570312, 0.5833282470703125, 0.6054916381835938, 0.627655029296875, 0.6498184204101562, 0.6719818115234375, 0.6941452026367188, 0.71630859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 3.0, 4.0, 6.0, 8.0, 12.0, 20.0, 25.0, 35.0, 56.0, 88.0, 104.0, 129.0, 145.0, 96.0, 82.0, 35.0, 37.0, 24.0, 19.0, 15.0, 8.0, 9.0, 7.0, 10.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00032067298889160156, -0.0003102831542491913, -0.000299893319606781, -0.00028950348496437073, -0.00027911365032196045, -0.00026872381567955017, -0.0002583339810371399, -0.0002479441463947296, -0.00023755431175231934, -0.00022716447710990906, -0.00021677464246749878, -0.0002063848078250885, -0.00019599497318267822, -0.00018560513854026794, -0.00017521530389785767, -0.0001648254692554474, -0.0001544356346130371, -0.00014404579997062683, -0.00013365596532821655, -0.00012326613068580627, -0.000112876296043396, -0.00010248646140098572, -9.209662675857544e-05, -8.170679211616516e-05, -7.131695747375488e-05, -6.0927122831344604e-05, -5.0537288188934326e-05, -4.014745354652405e-05, -2.975761890411377e-05, -1.936778426170349e-05, -8.977949619293213e-06, 1.4118850231170654e-06, 1.1801719665527344e-05, 2.2191554307937622e-05, 3.25813889503479e-05, 4.297122359275818e-05, 5.336105823516846e-05, 6.375089287757874e-05, 7.414072751998901e-05, 8.453056216239929e-05, 9.492039680480957e-05, 0.00010531023144721985, 0.00011570006608963013, 0.0001260899007320404, 0.00013647973537445068, 0.00014686957001686096, 0.00015725940465927124, 0.00016764923930168152, 0.0001780390739440918, 0.00018842890858650208, 0.00019881874322891235, 0.00020920857787132263, 0.0002195984125137329, 0.0002299882471561432, 0.00024037808179855347, 0.00025076791644096375, 0.000261157751083374, 0.0002715475857257843, 0.0002819374203681946, 0.00029232725501060486, 0.00030271708965301514, 0.0003131069242954254, 0.0003234967589378357, 0.00033388659358024597, 0.00034427642822265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 10.0, 4.0, 12.0, 14.0, 25.0, 36.0, 58.0, 104.0, 150.0, 237.0, 367.0, 608.0, 1012.0, 1767.0, 3138.0, 5514.0, 10002.0, 18346.0, 34348.0, 65574.0, 124398.0, 203298.0, 227634.0, 161097.0, 88826.0, 47006.0, 24732.0, 13290.0, 7326.0, 4055.0, 2213.0, 1334.0, 758.0, 494.0, 280.0, 182.0, 90.0, 73.0, 48.0, 42.0, 14.0, 17.0, 8.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7470779418945312, -0.7231597900390625, -0.6992416381835938, -0.675323486328125, -0.6514053344726562, -0.6274871826171875, -0.6035690307617188, -0.57965087890625, -0.5557327270507812, -0.5318145751953125, -0.5078964233398438, -0.483978271484375, -0.46006011962890625, -0.4361419677734375, -0.41222381591796875, -0.3883056640625, -0.36438751220703125, -0.3404693603515625, -0.31655120849609375, -0.292633056640625, -0.26871490478515625, -0.2447967529296875, -0.22087860107421875, -0.19696044921875, -0.17304229736328125, -0.1491241455078125, -0.12520599365234375, -0.101287841796875, -0.07736968994140625, -0.0534515380859375, -0.02953338623046875, -0.005615234375, 0.01830291748046875, 0.0422210693359375, 0.06613922119140625, 0.090057373046875, 0.11397552490234375, 0.1378936767578125, 0.16181182861328125, 0.18572998046875, 0.20964813232421875, 0.2335662841796875, 0.25748443603515625, 0.281402587890625, 0.30532073974609375, 0.3292388916015625, 0.35315704345703125, 0.3770751953125, 0.40099334716796875, 0.4249114990234375, 0.44882965087890625, 0.472747802734375, 0.49666595458984375, 0.5205841064453125, 0.5445022583007812, 0.56842041015625, 0.5923385620117188, 0.6162567138671875, 0.6401748657226562, 0.664093017578125, 0.6880111694335938, 0.7119293212890625, 0.7358474731445312, 0.759765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 3.0, 4.0, 8.0, 9.0, 13.0, 10.0, 14.0, 12.0, 16.0, 18.0, 23.0, 45.0, 41.0, 53.0, 52.0, 53.0, 69.0, 74.0, 68.0, 59.0, 51.0, 50.0, 52.0, 41.0, 31.0, 19.0, 14.0, 16.0, 18.0, 11.0, 8.0, 9.0, 6.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.267578125, -1.2347640991210938, -1.2019500732421875, -1.1691360473632812, -1.136322021484375, -1.1035079956054688, -1.0706939697265625, -1.0378799438476562, -1.00506591796875, -0.9722518920898438, -0.9394378662109375, -0.9066238403320312, -0.873809814453125, -0.8409957885742188, -0.8081817626953125, -0.7753677368164062, -0.7425537109375, -0.7097396850585938, -0.6769256591796875, -0.6441116333007812, -0.611297607421875, -0.5784835815429688, -0.5456695556640625, -0.5128555297851562, -0.48004150390625, -0.44722747802734375, -0.4144134521484375, -0.38159942626953125, -0.348785400390625, -0.31597137451171875, -0.2831573486328125, -0.25034332275390625, -0.217529296875, -0.18471527099609375, -0.1519012451171875, -0.11908721923828125, -0.086273193359375, -0.05345916748046875, -0.0206451416015625, 0.01216888427734375, 0.04498291015625, 0.07779693603515625, 0.1106109619140625, 0.14342498779296875, 0.176239013671875, 0.20905303955078125, 0.2418670654296875, 0.27468109130859375, 0.3074951171875, 0.34030914306640625, 0.3731231689453125, 0.40593719482421875, 0.438751220703125, 0.47156524658203125, 0.5043792724609375, 0.5371932983398438, 0.57000732421875, 0.6028213500976562, 0.6356353759765625, 0.6684494018554688, 0.701263427734375, 0.7340774536132812, 0.7668914794921875, 0.7997055053710938, 0.83251953125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 9.0, 19.0, 39.0, 81.0, 130.0, 149.0, 200.0, 156.0, 122.0, 51.0, 26.0, 11.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.805679321289062, -15.066817283630371, -14.32795524597168, -13.589094161987305, -12.850232124328613, -12.111370086669922, -11.372509002685547, -10.633646965026855, -9.894784927368164, -9.155922889709473, -8.417060852050781, -7.678199768066406, -6.939337730407715, -6.200475692749023, -5.46161413192749, -4.722752571105957, -3.9838905334472656, -3.2450287342071533, -2.506166934967041, -1.7673051357269287, -1.0284433364868164, -0.2895815372467041, 0.4492802619934082, 1.1881418228149414, 1.9270038604736328, 2.665865659713745, 3.4047274589538574, 4.143589019775391, 4.882451057434082, 5.621313095092773, 6.360174655914307, 7.09903621673584, 7.837896347045898, 8.57675838470459, 9.315620422363281, 10.054481506347656, 10.793343544006348, 11.532205581665039, 12.271066665649414, 13.009928703308105, 13.748790740966797, 14.487652778625488, 15.22651481628418, 15.965375900268555, 16.704238891601562, 17.443099975585938, 18.181961059570312, 18.920822143554688, 19.659685134887695, 20.39854621887207, 21.137409210205078, 21.876270294189453, 22.615131378173828, 23.353994369506836, 24.09285545349121, 24.83171844482422, 25.570579528808594, 26.30944061279297, 27.048303604125977, 27.78716468811035, 28.52602767944336, 29.264888763427734, 30.00374984741211, 30.742610931396484, 31.481473922729492]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 13.0, 13.0, 12.0, 22.0, 20.0, 25.0, 24.0, 45.0, 28.0, 30.0, 39.0, 43.0, 33.0, 40.0, 40.0, 36.0, 40.0, 36.0, 36.0, 40.0, 36.0, 42.0, 34.0, 28.0, 32.0, 26.0, 30.0, 23.0, 14.0, 17.0, 16.0, 16.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.92996597290039, -12.569768905639648, -12.209572792053223, -11.84937572479248, -11.489179611206055, -11.128982543945312, -10.76878547668457, -10.408589363098145, -10.048393249511719, -9.688196182250977, -9.32800006866455, -8.967803001403809, -8.607606887817383, -8.24740982055664, -7.887213230133057, -7.527016639709473, -7.1668195724487305, -6.8066229820251465, -6.4464263916015625, -6.08622932434082, -5.7260332107543945, -5.365836143493652, -5.005639553070068, -4.645442962646484, -4.2852463722229, -3.9250497817993164, -3.5648531913757324, -3.2046563625335693, -2.8444597721099854, -2.4842631816864014, -2.1240663528442383, -1.7638697624206543, -1.403672218322754, -1.04347562789917, -0.6832789182662964, -0.32308220863342285, 0.03711438179016113, 0.3973109722137451, 0.7575078010559082, 1.1177043914794922, 1.4779009819030762, 1.8380975723266602, 2.198294162750244, 2.5584909915924072, 2.918687582015991, 3.278884172439575, 3.6390810012817383, 3.9992775917053223, 4.359474182128906, 4.71967077255249, 5.079867362976074, 5.440064430236816, 5.800260543823242, 6.160457611083984, 6.520654201507568, 6.880850791931152, 7.241047382354736, 7.60124397277832, 7.961440563201904, 8.321637153625488, 8.68183422088623, 9.042030334472656, 9.402227401733398, 9.76242446899414, 10.122620582580566]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 13.0, 12.0, 13.0, 26.0, 25.0, 47.0, 75.0, 89.0, 156.0, 235.0, 361.0, 607.0, 1034.0, 2019.0, 3895.0, 7796.0, 17077.0, 41305.0, 109771.0, 348469.0, 1485683.0, 1603979.0, 375192.0, 117300.0, 43801.0, 18271.0, 8307.0, 3971.0, 2004.0, 1132.0, 610.0, 366.0, 233.0, 135.0, 82.0, 58.0, 46.0, 29.0, 21.0, 13.0, 8.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01171875, -2.928131103515625, -2.84454345703125, -2.760955810546875, -2.6773681640625, -2.593780517578125, -2.51019287109375, -2.426605224609375, -2.343017578125, -2.259429931640625, -2.17584228515625, -2.092254638671875, -2.0086669921875, -1.925079345703125, -1.84149169921875, -1.757904052734375, -1.67431640625, -1.590728759765625, -1.50714111328125, -1.423553466796875, -1.3399658203125, -1.256378173828125, -1.17279052734375, -1.089202880859375, -1.005615234375, -0.922027587890625, -0.83843994140625, -0.754852294921875, -0.6712646484375, -0.587677001953125, -0.50408935546875, -0.420501708984375, -0.3369140625, -0.253326416015625, -0.16973876953125, -0.086151123046875, -0.0025634765625, 0.081024169921875, 0.16461181640625, 0.248199462890625, 0.331787109375, 0.415374755859375, 0.49896240234375, 0.582550048828125, 0.6661376953125, 0.749725341796875, 0.83331298828125, 0.916900634765625, 1.00048828125, 1.084075927734375, 1.16766357421875, 1.251251220703125, 1.3348388671875, 1.418426513671875, 1.50201416015625, 1.585601806640625, 1.669189453125, 1.752777099609375, 1.83636474609375, 1.919952392578125, 2.0035400390625, 2.087127685546875, 2.17071533203125, 2.254302978515625, 2.337890625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 7.0, 8.0, 10.0, 12.0, 7.0, 16.0, 16.0, 18.0, 18.0, 23.0, 33.0, 31.0, 33.0, 37.0, 43.0, 45.0, 48.0, 49.0, 40.0, 35.0, 41.0, 38.0, 39.0, 34.0, 45.0, 32.0, 30.0, 28.0, 28.0, 21.0, 15.0, 19.0, 17.0, 13.0, 9.0, 12.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.34375, -1.29754638671875, -1.2513427734375, -1.20513916015625, -1.158935546875, -1.11273193359375, -1.0665283203125, -1.02032470703125, -0.97412109375, -0.92791748046875, -0.8817138671875, -0.83551025390625, -0.789306640625, -0.74310302734375, -0.6968994140625, -0.65069580078125, -0.6044921875, -0.55828857421875, -0.5120849609375, -0.46588134765625, -0.419677734375, -0.37347412109375, -0.3272705078125, -0.28106689453125, -0.23486328125, -0.18865966796875, -0.1424560546875, -0.09625244140625, -0.050048828125, -0.00384521484375, 0.0423583984375, 0.08856201171875, 0.134765625, 0.18096923828125, 0.2271728515625, 0.27337646484375, 0.319580078125, 0.36578369140625, 0.4119873046875, 0.45819091796875, 0.50439453125, 0.55059814453125, 0.5968017578125, 0.64300537109375, 0.689208984375, 0.73541259765625, 0.7816162109375, 0.82781982421875, 0.8740234375, 0.92022705078125, 0.9664306640625, 1.01263427734375, 1.058837890625, 1.10504150390625, 1.1512451171875, 1.19744873046875, 1.24365234375, 1.28985595703125, 1.3360595703125, 1.38226318359375, 1.428466796875, 1.47467041015625, 1.5208740234375, 1.56707763671875, 1.61328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 8.0, 10.0, 22.0, 18.0, 32.0, 44.0, 81.0, 151.0, 247.0, 483.0, 1125.0, 2731.0, 7923.0, 25051.0, 95344.0, 464482.0, 2740272.0, 683070.0, 125355.0, 32117.0, 9688.0, 3428.0, 1348.0, 548.0, 292.0, 169.0, 74.0, 51.0, 42.0, 24.0, 17.0, 11.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.81640625, -3.67291259765625, -3.5294189453125, -3.38592529296875, -3.242431640625, -3.09893798828125, -2.9554443359375, -2.81195068359375, -2.66845703125, -2.52496337890625, -2.3814697265625, -2.23797607421875, -2.094482421875, -1.95098876953125, -1.8074951171875, -1.66400146484375, -1.5205078125, -1.37701416015625, -1.2335205078125, -1.09002685546875, -0.946533203125, -0.80303955078125, -0.6595458984375, -0.51605224609375, -0.37255859375, -0.22906494140625, -0.0855712890625, 0.05792236328125, 0.201416015625, 0.34490966796875, 0.4884033203125, 0.63189697265625, 0.775390625, 0.91888427734375, 1.0623779296875, 1.20587158203125, 1.349365234375, 1.49285888671875, 1.6363525390625, 1.77984619140625, 1.92333984375, 2.06683349609375, 2.2103271484375, 2.35382080078125, 2.497314453125, 2.64080810546875, 2.7843017578125, 2.92779541015625, 3.0712890625, 3.21478271484375, 3.3582763671875, 3.50177001953125, 3.645263671875, 3.78875732421875, 3.9322509765625, 4.07574462890625, 4.21923828125, 4.36273193359375, 4.5062255859375, 4.64971923828125, 4.793212890625, 4.93670654296875, 5.0802001953125, 5.22369384765625, 5.3671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 12.0, 8.0, 11.0, 13.0, 24.0, 31.0, 47.0, 64.0, 83.0, 142.0, 170.0, 302.0, 477.0, 763.0, 701.0, 416.0, 246.0, 172.0, 107.0, 80.0, 44.0, 53.0, 30.0, 24.0, 18.0, 9.0, 8.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.7503662109375, -4.610107421875, -4.4698486328125, -4.32958984375, -4.1893310546875, -4.049072265625, -3.9088134765625, -3.7685546875, -3.6282958984375, -3.488037109375, -3.3477783203125, -3.20751953125, -3.0672607421875, -2.927001953125, -2.7867431640625, -2.646484375, -2.5062255859375, -2.365966796875, -2.2257080078125, -2.08544921875, -1.9451904296875, -1.804931640625, -1.6646728515625, -1.5244140625, -1.3841552734375, -1.243896484375, -1.1036376953125, -0.96337890625, -0.8231201171875, -0.682861328125, -0.5426025390625, -0.40234375, -0.2620849609375, -0.121826171875, 0.0184326171875, 0.15869140625, 0.2989501953125, 0.439208984375, 0.5794677734375, 0.7197265625, 0.8599853515625, 1.000244140625, 1.1405029296875, 1.28076171875, 1.4210205078125, 1.561279296875, 1.7015380859375, 1.841796875, 1.9820556640625, 2.122314453125, 2.2625732421875, 2.40283203125, 2.5430908203125, 2.683349609375, 2.8236083984375, 2.9638671875, 3.1041259765625, 3.244384765625, 3.3846435546875, 3.52490234375, 3.6651611328125, 3.805419921875, 3.9456787109375, 4.0859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 13.0, 7.0, 9.0, 22.0, 45.0, 67.0, 71.0, 107.0, 137.0, 142.0, 111.0, 94.0, 68.0, 47.0, 20.0, 18.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.525554656982422, -14.800288200378418, -14.075021743774414, -13.349756240844727, -12.624488830566406, -11.899223327636719, -11.173956871032715, -10.448690414428711, -9.723423957824707, -8.998157501220703, -8.2728910446167, -7.5476250648498535, -6.82235860824585, -6.097092151641846, -5.371826171875, -4.646559715270996, -3.921293258666992, -3.1960268020629883, -2.4707605838775635, -1.7454943656921387, -1.0202279090881348, -0.29496145248413086, 0.43030452728271484, 1.1555709838867188, 1.8808374404907227, 2.6061038970947266, 3.3313701152801514, 4.056636333465576, 4.78190279006958, 5.507169246673584, 6.23243522644043, 6.957701683044434, 7.68297004699707, 8.408236503601074, 9.133502960205078, 9.858768463134766, 10.584035873413086, 11.309301376342773, 12.034567832946777, 12.759834289550781, 13.485100746154785, 14.210367202758789, 14.935633659362793, 15.660900115966797, 16.386165618896484, 17.111433029174805, 17.836698532104492, 18.561965942382812, 19.2872314453125, 20.012496948242188, 20.737764358520508, 21.463029861450195, 22.188297271728516, 22.913562774658203, 23.63882827758789, 24.36409568786621, 25.08936309814453, 25.81462860107422, 26.53989601135254, 27.265161514282227, 27.990428924560547, 28.715694427490234, 29.440959930419922, 30.166227340698242, 30.89149284362793]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 1.0, 7.0, 2.0, 5.0, 9.0, 17.0, 20.0, 19.0, 22.0, 23.0, 23.0, 26.0, 22.0, 24.0, 29.0, 45.0, 34.0, 38.0, 40.0, 39.0, 36.0, 37.0, 42.0, 37.0, 39.0, 30.0, 31.0, 25.0, 33.0, 28.0, 26.0, 23.0, 19.0, 21.0, 14.0, 19.0, 19.0, 13.0, 10.0, 8.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.159262657165527, -9.850515365600586, -9.541768074035645, -9.233020782470703, -8.924274444580078, -8.615527153015137, -8.306779861450195, -7.998032569885254, -7.6892852783203125, -7.380537986755371, -7.07179069519043, -6.7630438804626465, -6.454296588897705, -6.145549297332764, -5.8368024826049805, -5.528055191040039, -5.219307899475098, -4.910560607910156, -4.601813316345215, -4.293066501617432, -3.9843192100524902, -3.675571918487549, -3.3668248653411865, -3.058077812194824, -2.749330520629883, -2.4405832290649414, -2.131836175918579, -1.8230890035629272, -1.5143418312072754, -1.2055946588516235, -0.8968474864959717, -0.5881004333496094, -0.2793540954589844, 0.02939307689666748, 0.33814024925231934, 0.6468874216079712, 0.955634593963623, 1.264381766319275, 1.5731289386749268, 1.881875991821289, 2.1906232833862305, 2.499370574951172, 2.808117628097534, 3.1168646812438965, 3.425611972808838, 3.7343592643737793, 4.0431060791015625, 4.351853370666504, 4.660600662231445, 4.969347953796387, 5.278095245361328, 5.586842060089111, 5.895589351654053, 6.204336643218994, 6.513083457946777, 6.821830749511719, 7.13057804107666, 7.439325332641602, 7.748072624206543, 8.056819915771484, 8.36556625366211, 8.67431354522705, 8.983060836791992, 9.291808128356934, 9.600555419921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 3.0, 7.0, 10.0, 15.0, 26.0, 43.0, 64.0, 67.0, 129.0, 196.0, 314.0, 448.0, 617.0, 970.0, 1397.0, 2156.0, 3194.0, 4472.0, 6823.0, 10706.0, 18168.0, 37653.0, 111625.0, 376851.0, 309672.0, 86102.0, 31834.0, 16093.0, 9536.0, 6386.0, 4186.0, 2820.0, 1955.0, 1338.0, 923.0, 575.0, 372.0, 252.0, 155.0, 134.0, 95.0, 55.0, 41.0, 20.0, 16.0, 8.0, 12.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.181640625, -3.0877685546875, -2.993896484375, -2.9000244140625, -2.80615234375, -2.7122802734375, -2.618408203125, -2.5245361328125, -2.4306640625, -2.3367919921875, -2.242919921875, -2.1490478515625, -2.05517578125, -1.9613037109375, -1.867431640625, -1.7735595703125, -1.6796875, -1.5858154296875, -1.491943359375, -1.3980712890625, -1.30419921875, -1.2103271484375, -1.116455078125, -1.0225830078125, -0.9287109375, -0.8348388671875, -0.740966796875, -0.6470947265625, -0.55322265625, -0.4593505859375, -0.365478515625, -0.2716064453125, -0.177734375, -0.0838623046875, 0.010009765625, 0.1038818359375, 0.19775390625, 0.2916259765625, 0.385498046875, 0.4793701171875, 0.5732421875, 0.6671142578125, 0.760986328125, 0.8548583984375, 0.94873046875, 1.0426025390625, 1.136474609375, 1.2303466796875, 1.32421875, 1.4180908203125, 1.511962890625, 1.6058349609375, 1.69970703125, 1.7935791015625, 1.887451171875, 1.9813232421875, 2.0751953125, 2.1690673828125, 2.262939453125, 2.3568115234375, 2.45068359375, 2.5445556640625, 2.638427734375, 2.7322998046875, 2.826171875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 8.0, 7.0, 8.0, 12.0, 5.0, 13.0, 16.0, 11.0, 13.0, 14.0, 27.0, 24.0, 23.0, 34.0, 24.0, 38.0, 32.0, 27.0, 33.0, 50.0, 38.0, 38.0, 26.0, 41.0, 34.0, 36.0, 39.0, 28.0, 37.0, 23.0, 27.0, 18.0, 22.0, 18.0, 19.0, 15.0, 15.0, 14.0, 10.0, 12.0, 11.0, 11.0, 11.0, 2.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.3798828125, -1.3389739990234375, -1.298065185546875, -1.2571563720703125, -1.21624755859375, -1.1753387451171875, -1.134429931640625, -1.0935211181640625, -1.0526123046875, -1.0117034912109375, -0.970794677734375, -0.9298858642578125, -0.88897705078125, -0.8480682373046875, -0.807159423828125, -0.7662506103515625, -0.725341796875, -0.6844329833984375, -0.643524169921875, -0.6026153564453125, -0.56170654296875, -0.5207977294921875, -0.479888916015625, -0.4389801025390625, -0.3980712890625, -0.3571624755859375, -0.316253662109375, -0.2753448486328125, -0.23443603515625, -0.1935272216796875, -0.152618408203125, -0.1117095947265625, -0.07080078125, -0.0298919677734375, 0.011016845703125, 0.0519256591796875, 0.09283447265625, 0.1337432861328125, 0.174652099609375, 0.2155609130859375, 0.2564697265625, 0.2973785400390625, 0.338287353515625, 0.3791961669921875, 0.42010498046875, 0.4610137939453125, 0.501922607421875, 0.5428314208984375, 0.583740234375, 0.6246490478515625, 0.665557861328125, 0.7064666748046875, 0.74737548828125, 0.7882843017578125, 0.829193115234375, 0.8701019287109375, 0.9110107421875, 0.9519195556640625, 0.992828369140625, 1.0337371826171875, 1.07464599609375, 1.1155548095703125, 1.156463623046875, 1.1973724365234375, 1.23828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 10.0, 9.0, 19.0, 30.0, 42.0, 63.0, 79.0, 149.0, 220.0, 378.0, 717.0, 1375.0, 2864.0, 6000.0, 13243.0, 29523.0, 83043.0, 395119.0, 382166.0, 79717.0, 28880.0, 12945.0, 5974.0, 2817.0, 1428.0, 715.0, 386.0, 237.0, 128.0, 74.0, 60.0, 42.0, 27.0, 23.0, 16.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40625, -3.280029296875, -3.15380859375, -3.027587890625, -2.9013671875, -2.775146484375, -2.64892578125, -2.522705078125, -2.396484375, -2.270263671875, -2.14404296875, -2.017822265625, -1.8916015625, -1.765380859375, -1.63916015625, -1.512939453125, -1.38671875, -1.260498046875, -1.13427734375, -1.008056640625, -0.8818359375, -0.755615234375, -0.62939453125, -0.503173828125, -0.376953125, -0.250732421875, -0.12451171875, 0.001708984375, 0.1279296875, 0.254150390625, 0.38037109375, 0.506591796875, 0.6328125, 0.759033203125, 0.88525390625, 1.011474609375, 1.1376953125, 1.263916015625, 1.39013671875, 1.516357421875, 1.642578125, 1.768798828125, 1.89501953125, 2.021240234375, 2.1474609375, 2.273681640625, 2.39990234375, 2.526123046875, 2.65234375, 2.778564453125, 2.90478515625, 3.031005859375, 3.1572265625, 3.283447265625, 3.40966796875, 3.535888671875, 3.662109375, 3.788330078125, 3.91455078125, 4.040771484375, 4.1669921875, 4.293212890625, 4.41943359375, 4.545654296875, 4.671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 6.0, 6.0, 9.0, 19.0, 17.0, 30.0, 37.0, 34.0, 48.0, 52.0, 49.0, 53.0, 74.0, 49.0, 78.0, 54.0, 58.0, 62.0, 39.0, 51.0, 21.0, 29.0, 24.0, 21.0, 19.0, 9.0, 10.0, 3.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.53778076171875, -5.3372802734375, -5.13677978515625, -4.936279296875, -4.73577880859375, -4.5352783203125, -4.33477783203125, -4.13427734375, -3.93377685546875, -3.7332763671875, -3.53277587890625, -3.332275390625, -3.13177490234375, -2.9312744140625, -2.73077392578125, -2.5302734375, -2.32977294921875, -2.1292724609375, -1.92877197265625, -1.728271484375, -1.52777099609375, -1.3272705078125, -1.12677001953125, -0.92626953125, -0.72576904296875, -0.5252685546875, -0.32476806640625, -0.124267578125, 0.07623291015625, 0.2767333984375, 0.47723388671875, 0.677734375, 0.87823486328125, 1.0787353515625, 1.27923583984375, 1.479736328125, 1.68023681640625, 1.8807373046875, 2.08123779296875, 2.28173828125, 2.48223876953125, 2.6827392578125, 2.88323974609375, 3.083740234375, 3.28424072265625, 3.4847412109375, 3.68524169921875, 3.8857421875, 4.08624267578125, 4.2867431640625, 4.48724365234375, 4.687744140625, 4.88824462890625, 5.0887451171875, 5.28924560546875, 5.48974609375, 5.69024658203125, 5.8907470703125, 6.09124755859375, 6.291748046875, 6.49224853515625, 6.6927490234375, 6.89324951171875, 7.09375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 6.0, 8.0, 20.0, 37.0, 33.0, 44.0, 60.0, 111.0, 194.0, 278.0, 432.0, 653.0, 1047.0, 1688.0, 2746.0, 4528.0, 7573.0, 13370.0, 26115.0, 56227.0, 141695.0, 333048.0, 266794.0, 101290.0, 42735.0, 20580.0, 10861.0, 6246.0, 3650.0, 2388.0, 1484.0, 960.0, 548.0, 375.0, 220.0, 157.0, 97.0, 61.0, 47.0, 45.0, 30.0, 17.0, 15.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.0869140625, -1.052764892578125, -1.01861572265625, -0.984466552734375, -0.9503173828125, -0.916168212890625, -0.88201904296875, -0.847869873046875, -0.813720703125, -0.779571533203125, -0.74542236328125, -0.711273193359375, -0.6771240234375, -0.642974853515625, -0.60882568359375, -0.574676513671875, -0.54052734375, -0.506378173828125, -0.47222900390625, -0.438079833984375, -0.4039306640625, -0.369781494140625, -0.33563232421875, -0.301483154296875, -0.267333984375, -0.233184814453125, -0.19903564453125, -0.164886474609375, -0.1307373046875, -0.096588134765625, -0.06243896484375, -0.028289794921875, 0.005859375, 0.040008544921875, 0.07415771484375, 0.108306884765625, 0.1424560546875, 0.176605224609375, 0.21075439453125, 0.244903564453125, 0.279052734375, 0.313201904296875, 0.34735107421875, 0.381500244140625, 0.4156494140625, 0.449798583984375, 0.48394775390625, 0.518096923828125, 0.55224609375, 0.586395263671875, 0.62054443359375, 0.654693603515625, 0.6888427734375, 0.722991943359375, 0.75714111328125, 0.791290283203125, 0.825439453125, 0.859588623046875, 0.89373779296875, 0.927886962890625, 0.9620361328125, 0.996185302734375, 1.03033447265625, 1.064483642578125, 1.0986328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 10.0, 13.0, 36.0, 59.0, 110.0, 223.0, 228.0, 125.0, 77.0, 22.0, 22.0, 19.0, 6.0, 5.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00069427490234375, -0.0006726160645484924, -0.0006509572267532349, -0.0006292983889579773, -0.0006076395511627197, -0.0005859807133674622, -0.0005643218755722046, -0.000542663037776947, -0.0005210041999816895, -0.0004993453621864319, -0.0004776865243911743, -0.00045602768659591675, -0.0004343688488006592, -0.0004127100110054016, -0.00039105117321014404, -0.0003693923354148865, -0.0003477334976196289, -0.00032607465982437134, -0.00030441582202911377, -0.0002827569842338562, -0.00026109814643859863, -0.00023943930864334106, -0.0002177804708480835, -0.00019612163305282593, -0.00017446279525756836, -0.0001528039574623108, -0.00013114511966705322, -0.00010948628187179565, -8.782744407653809e-05, -6.616860628128052e-05, -4.450976848602295e-05, -2.285093069076538e-05, -1.1920928955078125e-06, 2.0466744899749756e-05, 4.2125582695007324e-05, 6.378442049026489e-05, 8.544325828552246e-05, 0.00010710209608078003, 0.0001287609338760376, 0.00015041977167129517, 0.00017207860946655273, 0.0001937374472618103, 0.00021539628505706787, 0.00023705512285232544, 0.000258713960647583, 0.0002803727984428406, 0.00030203163623809814, 0.0003236904740333557, 0.0003453493118286133, 0.00036700814962387085, 0.0003886669874191284, 0.000410325825214386, 0.00043198466300964355, 0.0004536435008049011, 0.0004753023386001587, 0.0004969611763954163, 0.0005186200141906738, 0.0005402788519859314, 0.000561937689781189, 0.0005835965275764465, 0.0006052553653717041, 0.0006269142031669617, 0.0006485730409622192, 0.0006702318787574768, 0.0006918907165527344]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 3.0, 9.0, 6.0, 14.0, 17.0, 29.0, 49.0, 45.0, 74.0, 110.0, 140.0, 242.0, 368.0, 626.0, 1128.0, 1829.0, 3331.0, 6019.0, 11423.0, 23853.0, 53577.0, 130219.0, 271104.0, 286713.0, 144678.0, 59274.0, 26030.0, 12622.0, 6485.0, 3634.0, 1982.0, 1097.0, 646.0, 397.0, 256.0, 180.0, 107.0, 80.0, 45.0, 27.0, 27.0, 17.0, 14.0, 13.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.873046875, -0.8419342041015625, -0.810821533203125, -0.7797088623046875, -0.74859619140625, -0.7174835205078125, -0.686370849609375, -0.6552581787109375, -0.6241455078125, -0.5930328369140625, -0.561920166015625, -0.5308074951171875, -0.49969482421875, -0.4685821533203125, -0.437469482421875, -0.4063568115234375, -0.375244140625, -0.3441314697265625, -0.313018798828125, -0.2819061279296875, -0.25079345703125, -0.2196807861328125, -0.188568115234375, -0.1574554443359375, -0.1263427734375, -0.0952301025390625, -0.064117431640625, -0.0330047607421875, -0.00189208984375, 0.0292205810546875, 0.060333251953125, 0.0914459228515625, 0.12255859375, 0.1536712646484375, 0.184783935546875, 0.2158966064453125, 0.24700927734375, 0.2781219482421875, 0.309234619140625, 0.3403472900390625, 0.3714599609375, 0.4025726318359375, 0.433685302734375, 0.4647979736328125, 0.49591064453125, 0.5270233154296875, 0.558135986328125, 0.5892486572265625, 0.620361328125, 0.6514739990234375, 0.682586669921875, 0.7136993408203125, 0.74481201171875, 0.7759246826171875, 0.807037353515625, 0.8381500244140625, 0.8692626953125, 0.9003753662109375, 0.931488037109375, 0.9626007080078125, 0.99371337890625, 1.0248260498046875, 1.055938720703125, 1.0870513916015625, 1.1181640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 13.0, 9.0, 19.0, 18.0, 23.0, 25.0, 17.0, 24.0, 33.0, 40.0, 62.0, 56.0, 62.0, 54.0, 71.0, 55.0, 54.0, 54.0, 47.0, 44.0, 37.0, 30.0, 22.0, 19.0, 19.0, 17.0, 9.0, 3.0, 6.0, 4.0, 2.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97412109375, -0.9378738403320312, -0.9016265869140625, -0.8653793334960938, -0.829132080078125, -0.7928848266601562, -0.7566375732421875, -0.7203903198242188, -0.68414306640625, -0.6478958129882812, -0.6116485595703125, -0.5754013061523438, -0.539154052734375, -0.5029067993164062, -0.4666595458984375, -0.43041229248046875, -0.3941650390625, -0.35791778564453125, -0.3216705322265625, -0.28542327880859375, -0.249176025390625, -0.21292877197265625, -0.1766815185546875, -0.14043426513671875, -0.10418701171875, -0.06793975830078125, -0.0316925048828125, 0.00455474853515625, 0.040802001953125, 0.07704925537109375, 0.1132965087890625, 0.14954376220703125, 0.185791015625, 0.22203826904296875, 0.2582855224609375, 0.29453277587890625, 0.330780029296875, 0.36702728271484375, 0.4032745361328125, 0.43952178955078125, 0.47576904296875, 0.5120162963867188, 0.5482635498046875, 0.5845108032226562, 0.620758056640625, 0.6570053100585938, 0.6932525634765625, 0.7294998168945312, 0.7657470703125, 0.8019943237304688, 0.8382415771484375, 0.8744888305664062, 0.910736083984375, 0.9469833374023438, 0.9832305908203125, 1.0194778442382812, 1.05572509765625, 1.0919723510742188, 1.1282196044921875, 1.1644668579101562, 1.200714111328125, 1.2369613647460938, 1.2732086181640625, 1.3094558715820312, 1.345703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 16.0, 55.0, 119.0, 256.0, 295.0, 175.0, 54.0, 18.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-56.889137268066406, -55.46892166137695, -54.048709869384766, -52.62849426269531, -51.208282470703125, -49.78806686401367, -48.36785125732422, -46.94763946533203, -45.52742385864258, -44.107208251953125, -42.68699645996094, -41.266780853271484, -39.84656524658203, -38.426353454589844, -37.00613784790039, -35.58592224121094, -34.16571044921875, -32.7454948425293, -31.32528305053711, -29.905067443847656, -28.484853744506836, -27.064640045166016, -25.644424438476562, -24.224210739135742, -22.803997039794922, -21.3837833404541, -19.96356964111328, -18.543354034423828, -17.123140335083008, -15.702926635742188, -14.28271198272705, -12.862497329711914, -11.442279815673828, -10.022066116333008, -8.601851463317871, -7.181637287139893, -5.761423110961914, -4.3412089347839355, -2.920994758605957, -1.5007801055908203, -0.08056640625, 1.3396477699279785, 2.759861946105957, 4.1800761222839355, 5.600290298461914, 7.020504474639893, 8.440718650817871, 9.860933303833008, 11.281147003173828, 12.701360702514648, 14.121575355529785, 15.541790008544922, 16.962003707885742, 18.382217407226562, 19.802433013916016, 21.222646713256836, 22.642860412597656, 24.063074111938477, 25.483287811279297, 26.90350341796875, 28.32371711730957, 29.74393081665039, 31.164146423339844, 32.58435821533203, 34.004573822021484]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 7.0, 5.0, 14.0, 13.0, 14.0, 20.0, 18.0, 27.0, 23.0, 40.0, 29.0, 35.0, 41.0, 32.0, 45.0, 40.0, 46.0, 33.0, 34.0, 47.0, 40.0, 42.0, 39.0, 37.0, 33.0, 34.0, 28.0, 30.0, 23.0, 23.0, 12.0, 18.0, 13.0, 10.0, 11.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.129358291625977, -11.744454383850098, -11.359551429748535, -10.974647521972656, -10.589743614196777, -10.204839706420898, -9.819936752319336, -9.435032844543457, -9.050128936767578, -8.6652250289917, -8.280322074890137, -7.895418167114258, -7.510514259338379, -7.125610828399658, -6.7407073974609375, -6.355803489685059, -5.970900058746338, -5.585996627807617, -5.201092720031738, -4.816189289093018, -4.431285381317139, -4.046381950378418, -3.661478281021118, -3.2765746116638184, -2.8916709423065186, -2.5067672729492188, -2.121863603591919, -1.7369600534439087, -1.3520563840866089, -0.9671527147293091, -0.5822491645812988, -0.19734549522399902, 0.18755817413330078, 0.5724618434906006, 0.9573654532432556, 1.3422690629959106, 1.7271727323532104, 2.1120762825012207, 2.4969799518585205, 2.8818836212158203, 3.26678729057312, 3.65169095993042, 4.036594390869141, 4.4214982986450195, 4.80640172958374, 5.191305637359619, 5.57620906829834, 5.961112976074219, 6.3460164070129395, 6.73091983795166, 7.115823745727539, 7.50072717666626, 7.885631084442139, 8.27053451538086, 8.655438423156738, 9.040342330932617, 9.42524528503418, 9.810149192810059, 10.195052146911621, 10.5799560546875, 10.964859962463379, 11.349763870239258, 11.73466682434082, 12.1195707321167, 12.504474639892578]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 12.0, 11.0, 22.0, 25.0, 40.0, 46.0, 78.0, 114.0, 191.0, 286.0, 439.0, 730.0, 1297.0, 2610.0, 5722.0, 13106.0, 33701.0, 99867.0, 380969.0, 1872947.0, 1385367.0, 271834.0, 76409.0, 27116.0, 10842.0, 4891.0, 2376.0, 1323.0, 679.0, 438.0, 247.0, 170.0, 100.0, 82.0, 45.0, 51.0, 20.0, 22.0, 13.0, 12.0, 4.0, 2.0, 2.0, 6.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-3.255859375, -3.16253662109375, -3.0692138671875, -2.97589111328125, -2.882568359375, -2.78924560546875, -2.6959228515625, -2.60260009765625, -2.50927734375, -2.41595458984375, -2.3226318359375, -2.22930908203125, -2.135986328125, -2.04266357421875, -1.9493408203125, -1.85601806640625, -1.7626953125, -1.66937255859375, -1.5760498046875, -1.48272705078125, -1.389404296875, -1.29608154296875, -1.2027587890625, -1.10943603515625, -1.01611328125, -0.92279052734375, -0.8294677734375, -0.73614501953125, -0.642822265625, -0.54949951171875, -0.4561767578125, -0.36285400390625, -0.26953125, -0.17620849609375, -0.0828857421875, 0.01043701171875, 0.103759765625, 0.19708251953125, 0.2904052734375, 0.38372802734375, 0.47705078125, 0.57037353515625, 0.6636962890625, 0.75701904296875, 0.850341796875, 0.94366455078125, 1.0369873046875, 1.13031005859375, 1.2236328125, 1.31695556640625, 1.4102783203125, 1.50360107421875, 1.596923828125, 1.69024658203125, 1.7835693359375, 1.87689208984375, 1.97021484375, 2.06353759765625, 2.1568603515625, 2.25018310546875, 2.343505859375, 2.43682861328125, 2.5301513671875, 2.62347412109375, 2.716796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 19.0, 16.0, 16.0, 16.0, 23.0, 24.0, 26.0, 28.0, 33.0, 43.0, 42.0, 46.0, 36.0, 38.0, 47.0, 53.0, 39.0, 43.0, 33.0, 41.0, 38.0, 32.0, 22.0, 26.0, 37.0, 18.0, 14.0, 22.0, 13.0, 11.0, 15.0, 7.0, 6.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.580078125, -1.528533935546875, -1.47698974609375, -1.425445556640625, -1.3739013671875, -1.322357177734375, -1.27081298828125, -1.219268798828125, -1.167724609375, -1.116180419921875, -1.06463623046875, -1.013092041015625, -0.9615478515625, -0.910003662109375, -0.85845947265625, -0.806915283203125, -0.75537109375, -0.703826904296875, -0.65228271484375, -0.600738525390625, -0.5491943359375, -0.497650146484375, -0.44610595703125, -0.394561767578125, -0.343017578125, -0.291473388671875, -0.23992919921875, -0.188385009765625, -0.1368408203125, -0.085296630859375, -0.03375244140625, 0.017791748046875, 0.0693359375, 0.120880126953125, 0.17242431640625, 0.223968505859375, 0.2755126953125, 0.327056884765625, 0.37860107421875, 0.430145263671875, 0.481689453125, 0.533233642578125, 0.58477783203125, 0.636322021484375, 0.6878662109375, 0.739410400390625, 0.79095458984375, 0.842498779296875, 0.89404296875, 0.945587158203125, 0.99713134765625, 1.048675537109375, 1.1002197265625, 1.151763916015625, 1.20330810546875, 1.254852294921875, 1.306396484375, 1.357940673828125, 1.40948486328125, 1.461029052734375, 1.5125732421875, 1.564117431640625, 1.61566162109375, 1.667205810546875, 1.71875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 10.0, 12.0, 24.0, 33.0, 78.0, 100.0, 195.0, 399.0, 723.0, 1509.0, 3571.0, 10438.0, 39883.0, 200652.0, 2159780.0, 1566449.0, 161618.0, 33831.0, 9156.0, 3051.0, 1317.0, 605.0, 367.0, 179.0, 113.0, 66.0, 28.0, 27.0, 18.0, 14.0, 2.0, 7.0, 6.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.12188720703125, -4.9508056640625, -4.77972412109375, -4.608642578125, -4.43756103515625, -4.2664794921875, -4.09539794921875, -3.92431640625, -3.75323486328125, -3.5821533203125, -3.41107177734375, -3.239990234375, -3.06890869140625, -2.8978271484375, -2.72674560546875, -2.5556640625, -2.38458251953125, -2.2135009765625, -2.04241943359375, -1.871337890625, -1.70025634765625, -1.5291748046875, -1.35809326171875, -1.18701171875, -1.01593017578125, -0.8448486328125, -0.67376708984375, -0.502685546875, -0.33160400390625, -0.1605224609375, 0.01055908203125, 0.181640625, 0.35272216796875, 0.5238037109375, 0.69488525390625, 0.865966796875, 1.03704833984375, 1.2081298828125, 1.37921142578125, 1.55029296875, 1.72137451171875, 1.8924560546875, 2.06353759765625, 2.234619140625, 2.40570068359375, 2.5767822265625, 2.74786376953125, 2.9189453125, 3.09002685546875, 3.2611083984375, 3.43218994140625, 3.603271484375, 3.77435302734375, 3.9454345703125, 4.11651611328125, 4.28759765625, 4.45867919921875, 4.6297607421875, 4.80084228515625, 4.971923828125, 5.14300537109375, 5.3140869140625, 5.48516845703125, 5.65625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 8.0, 4.0, 3.0, 21.0, 19.0, 26.0, 43.0, 60.0, 79.0, 124.0, 177.0, 312.0, 559.0, 818.0, 679.0, 396.0, 236.0, 159.0, 85.0, 72.0, 53.0, 30.0, 29.0, 18.0, 19.0, 16.0, 2.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.4881591796875, -4.331787109375, -4.1754150390625, -4.01904296875, -3.8626708984375, -3.706298828125, -3.5499267578125, -3.3935546875, -3.2371826171875, -3.080810546875, -2.9244384765625, -2.76806640625, -2.6116943359375, -2.455322265625, -2.2989501953125, -2.142578125, -1.9862060546875, -1.829833984375, -1.6734619140625, -1.51708984375, -1.3607177734375, -1.204345703125, -1.0479736328125, -0.8916015625, -0.7352294921875, -0.578857421875, -0.4224853515625, -0.26611328125, -0.1097412109375, 0.046630859375, 0.2030029296875, 0.359375, 0.5157470703125, 0.672119140625, 0.8284912109375, 0.98486328125, 1.1412353515625, 1.297607421875, 1.4539794921875, 1.6103515625, 1.7667236328125, 1.923095703125, 2.0794677734375, 2.23583984375, 2.3922119140625, 2.548583984375, 2.7049560546875, 2.861328125, 3.0177001953125, 3.174072265625, 3.3304443359375, 3.48681640625, 3.6431884765625, 3.799560546875, 3.9559326171875, 4.1123046875, 4.2686767578125, 4.425048828125, 4.5814208984375, 4.73779296875, 4.8941650390625, 5.050537109375, 5.2069091796875, 5.36328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 12.0, 33.0, 72.0, 115.0, 173.0, 167.0, 165.0, 103.0, 82.0, 32.0, 13.0, 13.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.73253631591797, -32.65579605102539, -31.579057693481445, -30.5023193359375, -29.425579071044922, -28.348840713500977, -27.27210235595703, -26.195362091064453, -25.118621826171875, -24.04188346862793, -22.96514320373535, -21.888404846191406, -20.811664581298828, -19.734926223754883, -18.658187866210938, -17.58144760131836, -16.504709243774414, -15.427969932556152, -14.35123062133789, -13.274492263793945, -12.197751998901367, -11.121013641357422, -10.04427433013916, -8.967535018920898, -7.890795707702637, -6.814056396484375, -5.737317085266113, -4.66057825088501, -3.583838939666748, -2.5070996284484863, -1.4303607940673828, -0.3536214828491211, 0.7231178283691406, 1.7998570203781128, 2.876596212387085, 3.9533352851867676, 5.030074596405029, 6.106813907623291, 7.1835527420043945, 8.260292053222656, 9.337031364440918, 10.41377067565918, 11.490509986877441, 12.567249298095703, 13.643987655639648, 14.720727920532227, 15.797466278076172, 16.87420654296875, 17.950944900512695, 19.02768325805664, 20.10442352294922, 21.181161880493164, 22.257902145385742, 23.334640502929688, 24.411380767822266, 25.48811912536621, 26.564857482910156, 27.6415958404541, 28.71833610534668, 29.795074462890625, 30.871814727783203, 31.94855308532715, 33.025291442871094, 34.10203170776367, 35.17877197265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 14.0, 10.0, 14.0, 16.0, 11.0, 14.0, 23.0, 27.0, 20.0, 35.0, 24.0, 22.0, 41.0, 31.0, 37.0, 32.0, 32.0, 40.0, 50.0, 42.0, 45.0, 32.0, 41.0, 26.0, 45.0, 34.0, 34.0, 26.0, 29.0, 23.0, 17.0, 15.0, 13.0, 10.0, 12.0, 7.0, 7.0, 9.0, 2.0, 1.0, 5.0, 7.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.403112411499023, -12.035148620605469, -11.667183876037598, -11.299219131469727, -10.931255340576172, -10.563291549682617, -10.195326805114746, -9.827362060546875, -9.45939826965332, -9.091434478759766, -8.723469734191895, -8.355504989624023, -7.987541198730469, -7.619576930999756, -7.251612663269043, -6.88364839553833, -6.515684127807617, -6.147719860076904, -5.779755592346191, -5.4117913246154785, -5.043827056884766, -4.675862789154053, -4.30789852142334, -3.939934253692627, -3.571969985961914, -3.204005718231201, -2.8360414505004883, -2.4680771827697754, -2.1001129150390625, -1.7321486473083496, -1.3641843795776367, -0.9962201118469238, -0.6282558441162109, -0.26029157638549805, 0.10767269134521484, 0.47563695907592773, 0.8436012268066406, 1.2115654945373535, 1.5795297622680664, 1.9474940299987793, 2.315458297729492, 2.683422565460205, 3.051386833190918, 3.419351100921631, 3.7873153686523438, 4.155279636383057, 4.5232439041137695, 4.891208171844482, 5.259172439575195, 5.627136707305908, 5.995100975036621, 6.363065242767334, 6.731029510498047, 7.09899377822876, 7.466958045959473, 7.8349223136901855, 8.202886581420898, 8.570850372314453, 8.938815116882324, 9.306779861450195, 9.67474365234375, 10.042707443237305, 10.410672187805176, 10.778636932373047, 11.146600723266602]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 9.0, 28.0, 40.0, 38.0, 87.0, 129.0, 148.0, 237.0, 356.0, 526.0, 762.0, 1195.0, 1731.0, 2614.0, 3952.0, 6206.0, 9329.0, 14719.0, 25348.0, 53694.0, 155237.0, 355555.0, 247430.0, 83311.0, 34142.0, 18631.0, 11504.0, 7411.0, 4698.0, 3176.0, 2104.0, 1439.0, 929.0, 606.0, 377.0, 261.0, 194.0, 117.0, 81.0, 62.0, 37.0, 31.0, 10.0, 16.0, 9.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.533203125, -2.45074462890625, -2.3682861328125, -2.28582763671875, -2.203369140625, -2.12091064453125, -2.0384521484375, -1.95599365234375, -1.87353515625, -1.79107666015625, -1.7086181640625, -1.62615966796875, -1.543701171875, -1.46124267578125, -1.3787841796875, -1.29632568359375, -1.2138671875, -1.13140869140625, -1.0489501953125, -0.96649169921875, -0.884033203125, -0.80157470703125, -0.7191162109375, -0.63665771484375, -0.55419921875, -0.47174072265625, -0.3892822265625, -0.30682373046875, -0.224365234375, -0.14190673828125, -0.0594482421875, 0.02301025390625, 0.10546875, 0.18792724609375, 0.2703857421875, 0.35284423828125, 0.435302734375, 0.51776123046875, 0.6002197265625, 0.68267822265625, 0.76513671875, 0.84759521484375, 0.9300537109375, 1.01251220703125, 1.094970703125, 1.17742919921875, 1.2598876953125, 1.34234619140625, 1.4248046875, 1.50726318359375, 1.5897216796875, 1.67218017578125, 1.754638671875, 1.83709716796875, 1.9195556640625, 2.00201416015625, 2.08447265625, 2.16693115234375, 2.2493896484375, 2.33184814453125, 2.414306640625, 2.49676513671875, 2.5792236328125, 2.66168212890625, 2.744140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 8.0, 7.0, 12.0, 12.0, 15.0, 13.0, 28.0, 17.0, 35.0, 30.0, 41.0, 40.0, 47.0, 40.0, 53.0, 51.0, 59.0, 52.0, 39.0, 48.0, 36.0, 51.0, 42.0, 33.0, 38.0, 24.0, 23.0, 19.0, 15.0, 14.0, 6.0, 12.0, 6.0, 6.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8896484375, -1.8302001953125, -1.770751953125, -1.7113037109375, -1.65185546875, -1.5924072265625, -1.532958984375, -1.4735107421875, -1.4140625, -1.3546142578125, -1.295166015625, -1.2357177734375, -1.17626953125, -1.1168212890625, -1.057373046875, -0.9979248046875, -0.9384765625, -0.8790283203125, -0.819580078125, -0.7601318359375, -0.70068359375, -0.6412353515625, -0.581787109375, -0.5223388671875, -0.462890625, -0.4034423828125, -0.343994140625, -0.2845458984375, -0.22509765625, -0.1656494140625, -0.106201171875, -0.0467529296875, 0.0126953125, 0.0721435546875, 0.131591796875, 0.1910400390625, 0.25048828125, 0.3099365234375, 0.369384765625, 0.4288330078125, 0.48828125, 0.5477294921875, 0.607177734375, 0.6666259765625, 0.72607421875, 0.7855224609375, 0.844970703125, 0.9044189453125, 0.9638671875, 1.0233154296875, 1.082763671875, 1.1422119140625, 1.20166015625, 1.2611083984375, 1.320556640625, 1.3800048828125, 1.439453125, 1.4989013671875, 1.558349609375, 1.6177978515625, 1.67724609375, 1.7366943359375, 1.796142578125, 1.8555908203125, 1.9150390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 3.0, 8.0, 11.0, 31.0, 30.0, 61.0, 79.0, 116.0, 159.0, 328.0, 598.0, 1218.0, 2530.0, 5846.0, 15134.0, 44435.0, 223876.0, 578253.0, 125233.0, 30799.0, 11044.0, 4578.0, 1995.0, 972.0, 510.0, 269.0, 149.0, 93.0, 56.0, 36.0, 26.0, 19.0, 10.0, 12.0, 9.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.12554931640625, -4.9620361328125, -4.79852294921875, -4.635009765625, -4.47149658203125, -4.3079833984375, -4.14447021484375, -3.98095703125, -3.81744384765625, -3.6539306640625, -3.49041748046875, -3.326904296875, -3.16339111328125, -2.9998779296875, -2.83636474609375, -2.6728515625, -2.50933837890625, -2.3458251953125, -2.18231201171875, -2.018798828125, -1.85528564453125, -1.6917724609375, -1.52825927734375, -1.36474609375, -1.20123291015625, -1.0377197265625, -0.87420654296875, -0.710693359375, -0.54718017578125, -0.3836669921875, -0.22015380859375, -0.056640625, 0.10687255859375, 0.2703857421875, 0.43389892578125, 0.597412109375, 0.76092529296875, 0.9244384765625, 1.08795166015625, 1.25146484375, 1.41497802734375, 1.5784912109375, 1.74200439453125, 1.905517578125, 2.06903076171875, 2.2325439453125, 2.39605712890625, 2.5595703125, 2.72308349609375, 2.8865966796875, 3.05010986328125, 3.213623046875, 3.37713623046875, 3.5406494140625, 3.70416259765625, 3.86767578125, 4.03118896484375, 4.1947021484375, 4.35821533203125, 4.521728515625, 4.68524169921875, 4.8487548828125, 5.01226806640625, 5.17578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 8.0, 7.0, 8.0, 9.0, 16.0, 20.0, 16.0, 25.0, 28.0, 30.0, 28.0, 35.0, 36.0, 40.0, 61.0, 33.0, 42.0, 53.0, 42.0, 54.0, 47.0, 31.0, 26.0, 40.0, 35.0, 34.0, 21.0, 25.0, 21.0, 25.0, 16.0, 14.0, 15.0, 16.0, 5.0, 5.0, 9.0, 2.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.3167724609375, -6.121826171875, -5.9268798828125, -5.73193359375, -5.5369873046875, -5.342041015625, -5.1470947265625, -4.9521484375, -4.7572021484375, -4.562255859375, -4.3673095703125, -4.17236328125, -3.9774169921875, -3.782470703125, -3.5875244140625, -3.392578125, -3.1976318359375, -3.002685546875, -2.8077392578125, -2.61279296875, -2.4178466796875, -2.222900390625, -2.0279541015625, -1.8330078125, -1.6380615234375, -1.443115234375, -1.2481689453125, -1.05322265625, -0.8582763671875, -0.663330078125, -0.4683837890625, -0.2734375, -0.0784912109375, 0.116455078125, 0.3114013671875, 0.50634765625, 0.7012939453125, 0.896240234375, 1.0911865234375, 1.2861328125, 1.4810791015625, 1.676025390625, 1.8709716796875, 2.06591796875, 2.2608642578125, 2.455810546875, 2.6507568359375, 2.845703125, 3.0406494140625, 3.235595703125, 3.4305419921875, 3.62548828125, 3.8204345703125, 4.015380859375, 4.2103271484375, 4.4052734375, 4.6002197265625, 4.795166015625, 4.9901123046875, 5.18505859375, 5.3800048828125, 5.574951171875, 5.7698974609375, 5.96484375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 3.0, 12.0, 18.0, 29.0, 40.0, 50.0, 68.0, 93.0, 154.0, 249.0, 331.0, 594.0, 994.0, 1680.0, 2938.0, 5127.0, 9730.0, 19399.0, 43383.0, 114623.0, 323268.0, 324858.0, 115857.0, 43518.0, 19307.0, 9658.0, 5197.0, 2959.0, 1641.0, 1061.0, 595.0, 395.0, 240.0, 134.0, 102.0, 69.0, 42.0, 32.0, 31.0, 22.0, 12.0, 12.0, 8.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0], "bins": [-1.3828125, -1.3433074951171875, -1.303802490234375, -1.2642974853515625, -1.22479248046875, -1.1852874755859375, -1.145782470703125, -1.1062774658203125, -1.0667724609375, -1.0272674560546875, -0.987762451171875, -0.9482574462890625, -0.90875244140625, -0.8692474365234375, -0.829742431640625, -0.7902374267578125, -0.750732421875, -0.7112274169921875, -0.671722412109375, -0.6322174072265625, -0.59271240234375, -0.5532073974609375, -0.513702392578125, -0.4741973876953125, -0.4346923828125, -0.3951873779296875, -0.355682373046875, -0.3161773681640625, -0.27667236328125, -0.2371673583984375, -0.197662353515625, -0.1581573486328125, -0.11865234375, -0.0791473388671875, -0.039642333984375, -0.0001373291015625, 0.03936767578125, 0.0788726806640625, 0.118377685546875, 0.1578826904296875, 0.1973876953125, 0.2368927001953125, 0.276397705078125, 0.3159027099609375, 0.35540771484375, 0.3949127197265625, 0.434417724609375, 0.4739227294921875, 0.513427734375, 0.5529327392578125, 0.592437744140625, 0.6319427490234375, 0.67144775390625, 0.7109527587890625, 0.750457763671875, 0.7899627685546875, 0.8294677734375, 0.8689727783203125, 0.908477783203125, 0.9479827880859375, 0.98748779296875, 1.0269927978515625, 1.066497802734375, 1.1060028076171875, 1.1455078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 18.0, 19.0, 26.0, 28.0, 52.0, 82.0, 150.0, 139.0, 146.0, 92.0, 57.0, 32.0, 26.0, 23.0, 17.0, 13.0, 10.0, 11.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004892349243164062, -0.0004732981324195862, -0.0004573613405227661, -0.00044142454862594604, -0.000425487756729126, -0.0004095509648323059, -0.00039361417293548584, -0.00037767738103866577, -0.0003617405891418457, -0.00034580379724502563, -0.00032986700534820557, -0.0003139302134513855, -0.00029799342155456543, -0.00028205662965774536, -0.0002661198377609253, -0.0002501830458641052, -0.00023424625396728516, -0.0002183094620704651, -0.00020237267017364502, -0.00018643587827682495, -0.00017049908638000488, -0.00015456229448318481, -0.00013862550258636475, -0.00012268871068954468, -0.00010675191879272461, -9.081512689590454e-05, -7.487833499908447e-05, -5.8941543102264404e-05, -4.3004751205444336e-05, -2.7067959308624268e-05, -1.11311674118042e-05, 4.805624485015869e-06, 2.0742416381835938e-05, 3.6679208278656006e-05, 5.2616000175476074e-05, 6.855279207229614e-05, 8.448958396911621e-05, 0.00010042637586593628, 0.00011636316776275635, 0.00013229995965957642, 0.00014823675155639648, 0.00016417354345321655, 0.00018011033535003662, 0.0001960471272468567, 0.00021198391914367676, 0.00022792071104049683, 0.0002438575029373169, 0.00025979429483413696, 0.00027573108673095703, 0.0002916678786277771, 0.00030760467052459717, 0.00032354146242141724, 0.0003394782543182373, 0.0003554150462150574, 0.00037135183811187744, 0.0003872886300086975, 0.0004032254219055176, 0.00041916221380233765, 0.0004350990056991577, 0.0004510357975959778, 0.00046697258949279785, 0.0004829093813896179, 0.000498846173286438, 0.0005147829651832581, 0.0005307197570800781]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 8.0, 12.0, 7.0, 2.0, 5.0, 9.0, 19.0, 19.0, 27.0, 35.0, 60.0, 85.0, 96.0, 151.0, 236.0, 382.0, 642.0, 1156.0, 2094.0, 4032.0, 8183.0, 17422.0, 40398.0, 102718.0, 272051.0, 344538.0, 151655.0, 56521.0, 23721.0, 10750.0, 5341.0, 2652.0, 1359.0, 775.0, 446.0, 293.0, 203.0, 128.0, 70.0, 79.0, 45.0, 38.0, 26.0, 16.0, 16.0, 12.0, 8.0, 8.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0595703125, -1.0232696533203125, -0.986968994140625, -0.9506683349609375, -0.91436767578125, -0.8780670166015625, -0.841766357421875, -0.8054656982421875, -0.7691650390625, -0.7328643798828125, -0.696563720703125, -0.6602630615234375, -0.62396240234375, -0.5876617431640625, -0.551361083984375, -0.5150604248046875, -0.478759765625, -0.4424591064453125, -0.406158447265625, -0.3698577880859375, -0.33355712890625, -0.2972564697265625, -0.260955810546875, -0.2246551513671875, -0.1883544921875, -0.1520538330078125, -0.115753173828125, -0.0794525146484375, -0.04315185546875, -0.0068511962890625, 0.029449462890625, 0.0657501220703125, 0.10205078125, 0.1383514404296875, 0.174652099609375, 0.2109527587890625, 0.24725341796875, 0.2835540771484375, 0.319854736328125, 0.3561553955078125, 0.3924560546875, 0.4287567138671875, 0.465057373046875, 0.5013580322265625, 0.53765869140625, 0.5739593505859375, 0.610260009765625, 0.6465606689453125, 0.682861328125, 0.7191619873046875, 0.755462646484375, 0.7917633056640625, 0.82806396484375, 0.8643646240234375, 0.900665283203125, 0.9369659423828125, 0.9732666015625, 1.0095672607421875, 1.045867919921875, 1.0821685791015625, 1.11846923828125, 1.1547698974609375, 1.191070556640625, 1.2273712158203125, 1.263671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 6.0, 4.0, 4.0, 5.0, 12.0, 17.0, 16.0, 23.0, 35.0, 23.0, 39.0, 64.0, 50.0, 75.0, 90.0, 80.0, 75.0, 80.0, 63.0, 57.0, 43.0, 26.0, 33.0, 22.0, 15.0, 8.0, 10.0, 6.0, 1.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8154296875, -1.7667388916015625, -1.718048095703125, -1.6693572998046875, -1.62066650390625, -1.5719757080078125, -1.523284912109375, -1.4745941162109375, -1.4259033203125, -1.3772125244140625, -1.328521728515625, -1.2798309326171875, -1.23114013671875, -1.1824493408203125, -1.133758544921875, -1.0850677490234375, -1.036376953125, -0.9876861572265625, -0.938995361328125, -0.8903045654296875, -0.84161376953125, -0.7929229736328125, -0.744232177734375, -0.6955413818359375, -0.6468505859375, -0.5981597900390625, -0.549468994140625, -0.5007781982421875, -0.45208740234375, -0.4033966064453125, -0.354705810546875, -0.3060150146484375, -0.25732421875, -0.2086334228515625, -0.159942626953125, -0.1112518310546875, -0.06256103515625, -0.0138702392578125, 0.034820556640625, 0.0835113525390625, 0.1322021484375, 0.1808929443359375, 0.229583740234375, 0.2782745361328125, 0.32696533203125, 0.3756561279296875, 0.424346923828125, 0.4730377197265625, 0.521728515625, 0.5704193115234375, 0.619110107421875, 0.6678009033203125, 0.71649169921875, 0.7651824951171875, 0.813873291015625, 0.8625640869140625, 0.9112548828125, 0.9599456787109375, 1.008636474609375, 1.0573272705078125, 1.10601806640625, 1.1547088623046875, 1.203399658203125, 1.2520904541015625, 1.30078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 12.0, 23.0, 52.0, 117.0, 211.0, 226.0, 167.0, 110.0, 53.0, 14.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.001815795898438, -21.930543899536133, -20.859270095825195, -19.78799819946289, -18.716724395751953, -17.64545249938965, -16.574180603027344, -15.502907752990723, -14.431634902954102, -13.36036205291748, -12.28908920288086, -11.217817306518555, -10.146544456481934, -9.075271606445312, -8.003999710083008, -6.932726860046387, -5.861454010009766, -4.7901811599731445, -3.7189087867736816, -2.6476361751556396, -1.5763635635375977, -0.5050907135009766, 0.5661816596984863, 1.6374540328979492, 2.7087268829345703, 3.7799994945526123, 4.851272106170654, 5.922544479370117, 6.993817329406738, 8.06509017944336, 9.136362075805664, 10.207634925842285, 11.278911590576172, 12.350184440612793, 13.421457290649414, 14.492729187011719, 15.56400203704834, 16.63527488708496, 17.706546783447266, 18.777820587158203, 19.849092483520508, 20.920364379882812, 21.99163818359375, 23.062910079956055, 24.13418197631836, 25.205455780029297, 26.2767276763916, 27.347999572753906, 28.419273376464844, 29.49054527282715, 30.561819076538086, 31.63309097290039, 32.70436477661133, 33.775634765625, 34.84690856933594, 35.918182373046875, 36.98945617675781, 38.06072998046875, 39.13199996948242, 40.20327377319336, 41.2745475769043, 42.34581756591797, 43.417091369628906, 44.488365173339844, 45.559635162353516]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 6.0, 9.0, 16.0, 14.0, 16.0, 11.0, 23.0, 29.0, 27.0, 35.0, 29.0, 44.0, 38.0, 29.0, 43.0, 37.0, 45.0, 40.0, 38.0, 33.0, 41.0, 41.0, 39.0, 43.0, 33.0, 37.0, 31.0, 28.0, 13.0, 21.0, 14.0, 15.0, 15.0, 10.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.081348419189453, -12.653268814086914, -12.225190162658691, -11.797110557556152, -11.36903190612793, -10.94095230102539, -10.512872695922852, -10.084793090820312, -9.65671443939209, -9.22863483428955, -8.800556182861328, -8.372476577758789, -7.944397449493408, -7.516318321228027, -7.088238716125488, -6.660159587860107, -6.232080459594727, -5.804001331329346, -5.375922203063965, -4.947842597961426, -4.519763469696045, -4.091684341430664, -3.663604974746704, -3.235525608062744, -2.8074464797973633, -2.3793673515319824, -1.9512879848480225, -1.523208737373352, -1.0951294898986816, -0.6670503616333008, -0.23897099494934082, 0.18910837173461914, 0.6171884536743164, 1.0452677011489868, 1.4733469486236572, 1.9014261960983276, 2.329505443572998, 2.757584571838379, 3.185663938522339, 3.613743305206299, 4.04182243347168, 4.4699015617370605, 4.897980690002441, 5.3260602951049805, 5.754139423370361, 6.182218551635742, 6.610298156738281, 7.038377285003662, 7.466456413269043, 7.894535541534424, 8.322614669799805, 8.750694274902344, 9.178773880004883, 9.606852531433105, 10.034932136535645, 10.463010787963867, 10.891090393066406, 11.319169998168945, 11.747248649597168, 12.175328254699707, 12.60340690612793, 13.031486511230469, 13.459566116333008, 13.887645721435547, 14.31572437286377]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 10.0, 17.0, 23.0, 38.0, 54.0, 75.0, 112.0, 154.0, 265.0, 405.0, 716.0, 1017.0, 1690.0, 2847.0, 4659.0, 8115.0, 13802.0, 24665.0, 45994.0, 89806.0, 188393.0, 433913.0, 961041.0, 1208154.0, 660448.0, 279040.0, 125636.0, 62998.0, 33512.0, 18735.0, 10764.0, 6504.0, 3866.0, 2464.0, 1519.0, 970.0, 638.0, 401.0, 261.0, 195.0, 117.0, 78.0, 52.0, 30.0, 35.0, 13.0, 16.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.60546875, -1.5540924072265625, -1.502716064453125, -1.4513397216796875, -1.39996337890625, -1.3485870361328125, -1.297210693359375, -1.2458343505859375, -1.1944580078125, -1.1430816650390625, -1.091705322265625, -1.0403289794921875, -0.98895263671875, -0.9375762939453125, -0.886199951171875, -0.8348236083984375, -0.783447265625, -0.7320709228515625, -0.680694580078125, -0.6293182373046875, -0.57794189453125, -0.5265655517578125, -0.475189208984375, -0.4238128662109375, -0.3724365234375, -0.3210601806640625, -0.269683837890625, -0.2183074951171875, -0.16693115234375, -0.1155548095703125, -0.064178466796875, -0.0128021240234375, 0.03857421875, 0.0899505615234375, 0.141326904296875, 0.1927032470703125, 0.24407958984375, 0.2954559326171875, 0.346832275390625, 0.3982086181640625, 0.4495849609375, 0.5009613037109375, 0.552337646484375, 0.6037139892578125, 0.65509033203125, 0.7064666748046875, 0.757843017578125, 0.8092193603515625, 0.860595703125, 0.9119720458984375, 0.963348388671875, 1.0147247314453125, 1.06610107421875, 1.1174774169921875, 1.168853759765625, 1.2202301025390625, 1.2716064453125, 1.3229827880859375, 1.374359130859375, 1.4257354736328125, 1.47711181640625, 1.5284881591796875, 1.579864501953125, 1.6312408447265625, 1.6826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 3.0, 6.0, 7.0, 13.0, 3.0, 10.0, 6.0, 11.0, 15.0, 21.0, 24.0, 21.0, 24.0, 35.0, 29.0, 35.0, 36.0, 39.0, 33.0, 37.0, 51.0, 37.0, 43.0, 43.0, 44.0, 37.0, 35.0, 38.0, 40.0, 33.0, 16.0, 23.0, 26.0, 14.0, 18.0, 22.0, 11.0, 15.0, 4.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4990234375, -1.44525146484375, -1.3914794921875, -1.33770751953125, -1.283935546875, -1.23016357421875, -1.1763916015625, -1.12261962890625, -1.06884765625, -1.01507568359375, -0.9613037109375, -0.90753173828125, -0.853759765625, -0.79998779296875, -0.7462158203125, -0.69244384765625, -0.638671875, -0.58489990234375, -0.5311279296875, -0.47735595703125, -0.423583984375, -0.36981201171875, -0.3160400390625, -0.26226806640625, -0.20849609375, -0.15472412109375, -0.1009521484375, -0.04718017578125, 0.006591796875, 0.06036376953125, 0.1141357421875, 0.16790771484375, 0.2216796875, 0.27545166015625, 0.3292236328125, 0.38299560546875, 0.436767578125, 0.49053955078125, 0.5443115234375, 0.59808349609375, 0.65185546875, 0.70562744140625, 0.7593994140625, 0.81317138671875, 0.866943359375, 0.92071533203125, 0.9744873046875, 1.02825927734375, 1.08203125, 1.13580322265625, 1.1895751953125, 1.24334716796875, 1.297119140625, 1.35089111328125, 1.4046630859375, 1.45843505859375, 1.51220703125, 1.56597900390625, 1.6197509765625, 1.67352294921875, 1.727294921875, 1.78106689453125, 1.8348388671875, 1.88861083984375, 1.9423828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 11.0, 35.0, 48.0, 61.0, 122.0, 210.0, 402.0, 852.0, 2305.0, 8103.0, 40292.0, 282305.0, 2805968.0, 928109.0, 102062.0, 16918.0, 3991.0, 1237.0, 556.0, 294.0, 159.0, 96.0, 48.0, 27.0, 21.0, 11.0, 12.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.859375, -5.66241455078125, -5.4654541015625, -5.26849365234375, -5.071533203125, -4.87457275390625, -4.6776123046875, -4.48065185546875, -4.28369140625, -4.08673095703125, -3.8897705078125, -3.69281005859375, -3.495849609375, -3.29888916015625, -3.1019287109375, -2.90496826171875, -2.7080078125, -2.51104736328125, -2.3140869140625, -2.11712646484375, -1.920166015625, -1.72320556640625, -1.5262451171875, -1.32928466796875, -1.13232421875, -0.93536376953125, -0.7384033203125, -0.54144287109375, -0.344482421875, -0.14752197265625, 0.0494384765625, 0.24639892578125, 0.443359375, 0.64031982421875, 0.8372802734375, 1.03424072265625, 1.231201171875, 1.42816162109375, 1.6251220703125, 1.82208251953125, 2.01904296875, 2.21600341796875, 2.4129638671875, 2.60992431640625, 2.806884765625, 3.00384521484375, 3.2008056640625, 3.39776611328125, 3.5947265625, 3.79168701171875, 3.9886474609375, 4.18560791015625, 4.382568359375, 4.57952880859375, 4.7764892578125, 4.97344970703125, 5.17041015625, 5.36737060546875, 5.5643310546875, 5.76129150390625, 5.958251953125, 6.15521240234375, 6.3521728515625, 6.54913330078125, 6.74609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 16.0, 26.0, 20.0, 38.0, 68.0, 117.0, 148.0, 268.0, 463.0, 789.0, 858.0, 490.0, 286.0, 172.0, 115.0, 76.0, 44.0, 24.0, 16.0, 12.0, 4.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3125, -7.1038818359375, -6.895263671875, -6.6866455078125, -6.47802734375, -6.2694091796875, -6.060791015625, -5.8521728515625, -5.6435546875, -5.4349365234375, -5.226318359375, -5.0177001953125, -4.80908203125, -4.6004638671875, -4.391845703125, -4.1832275390625, -3.974609375, -3.7659912109375, -3.557373046875, -3.3487548828125, -3.14013671875, -2.9315185546875, -2.722900390625, -2.5142822265625, -2.3056640625, -2.0970458984375, -1.888427734375, -1.6798095703125, -1.47119140625, -1.2625732421875, -1.053955078125, -0.8453369140625, -0.63671875, -0.4281005859375, -0.219482421875, -0.0108642578125, 0.19775390625, 0.4063720703125, 0.614990234375, 0.8236083984375, 1.0322265625, 1.2408447265625, 1.449462890625, 1.6580810546875, 1.86669921875, 2.0753173828125, 2.283935546875, 2.4925537109375, 2.701171875, 2.9097900390625, 3.118408203125, 3.3270263671875, 3.53564453125, 3.7442626953125, 3.952880859375, 4.1614990234375, 4.3701171875, 4.5787353515625, 4.787353515625, 4.9959716796875, 5.20458984375, 5.4132080078125, 5.621826171875, 5.8304443359375, 6.0390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 12.0, 22.0, 64.0, 146.0, 255.0, 253.0, 159.0, 59.0, 21.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.74494934082031, -74.0639419555664, -72.3829345703125, -70.7019271850586, -69.02091979980469, -67.33991241455078, -65.65890502929688, -63.97789764404297, -62.29689025878906, -60.615882873535156, -58.93487548828125, -57.253868103027344, -55.57286071777344, -53.89185333251953, -52.210845947265625, -50.52983856201172, -48.84882736206055, -47.16781997680664, -45.486812591552734, -43.80580520629883, -42.12479782104492, -40.443790435791016, -38.762779235839844, -37.08177185058594, -35.40076446533203, -33.719757080078125, -32.03874969482422, -30.357742309570312, -28.676734924316406, -26.9957275390625, -25.31471824645996, -23.633710861206055, -21.95270347595215, -20.271696090698242, -18.590688705444336, -16.909679412841797, -15.228672981262207, -13.5476655960083, -11.866657257080078, -10.185649871826172, -8.504642486572266, -6.823635101318359, -5.142627239227295, -3.4616193771362305, -1.7806119918823242, -0.09960460662841797, 1.5814037322998047, 3.262411117553711, 4.943418502807617, 6.624425888061523, 8.30543327331543, 9.986441612243652, 11.667448997497559, 13.348456382751465, 15.029464721679688, 16.710472106933594, 18.3914794921875, 20.072486877441406, 21.753494262695312, 23.43450164794922, 25.115509033203125, 26.79651641845703, 28.47752571105957, 30.158533096313477, 31.839540481567383]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 6.0, 5.0, 11.0, 17.0, 13.0, 19.0, 25.0, 29.0, 40.0, 29.0, 36.0, 36.0, 37.0, 48.0, 56.0, 44.0, 50.0, 52.0, 63.0, 55.0, 44.0, 41.0, 26.0, 48.0, 26.0, 28.0, 17.0, 9.0, 16.0, 14.0, 9.0, 8.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.41199493408203, -15.853789329528809, -15.295584678649902, -14.73737907409668, -14.179174423217773, -13.62096881866455, -13.062763214111328, -12.504558563232422, -11.9463529586792, -11.388147354125977, -10.82994270324707, -10.271737098693848, -9.713531494140625, -9.155326843261719, -8.597121238708496, -8.038915634155273, -7.480710983276367, -6.922505855560303, -6.364300727844238, -5.806095123291016, -5.247889995574951, -4.689684867858887, -4.131479263305664, -3.5732741355895996, -3.015069007873535, -2.4568638801574707, -1.8986585140228271, -1.3404532670974731, -0.7822480201721191, -0.2240428924560547, 0.33416247367858887, 0.8923678398132324, 1.4505748748779297, 2.008780002593994, 2.5669853687286377, 3.1251907348632812, 3.6833958625793457, 4.24160099029541, 4.799806594848633, 5.358011722564697, 5.916216850280762, 6.474421977996826, 7.032627105712891, 7.590832710266113, 8.149038314819336, 8.707242965698242, 9.265448570251465, 9.823654174804688, 10.381858825683594, 10.940064430236816, 11.498269081115723, 12.056474685668945, 12.614679336547852, 13.172884941101074, 13.731090545654297, 14.289295196533203, 14.847500801086426, 15.405706405639648, 15.963911056518555, 16.52211570739746, 17.080322265625, 17.638526916503906, 18.196731567382812, 18.75493812561035, 19.313142776489258]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 7.0, 5.0, 3.0, 4.0, 8.0, 21.0, 14.0, 26.0, 35.0, 84.0, 119.0, 186.0, 285.0, 422.0, 716.0, 1098.0, 1915.0, 3190.0, 5063.0, 8157.0, 13365.0, 22283.0, 41961.0, 97821.0, 248287.0, 318069.0, 152764.0, 59854.0, 29369.0, 16924.0, 10356.0, 6238.0, 3712.0, 2283.0, 1446.0, 931.0, 547.0, 357.0, 221.0, 148.0, 95.0, 58.0, 45.0, 31.0, 17.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.798828125, -2.714599609375, -2.63037109375, -2.546142578125, -2.4619140625, -2.377685546875, -2.29345703125, -2.209228515625, -2.125, -2.040771484375, -1.95654296875, -1.872314453125, -1.7880859375, -1.703857421875, -1.61962890625, -1.535400390625, -1.451171875, -1.366943359375, -1.28271484375, -1.198486328125, -1.1142578125, -1.030029296875, -0.94580078125, -0.861572265625, -0.77734375, -0.693115234375, -0.60888671875, -0.524658203125, -0.4404296875, -0.356201171875, -0.27197265625, -0.187744140625, -0.103515625, -0.019287109375, 0.06494140625, 0.149169921875, 0.2333984375, 0.317626953125, 0.40185546875, 0.486083984375, 0.5703125, 0.654541015625, 0.73876953125, 0.822998046875, 0.9072265625, 0.991455078125, 1.07568359375, 1.159912109375, 1.244140625, 1.328369140625, 1.41259765625, 1.496826171875, 1.5810546875, 1.665283203125, 1.74951171875, 1.833740234375, 1.91796875, 2.002197265625, 2.08642578125, 2.170654296875, 2.2548828125, 2.339111328125, 2.42333984375, 2.507568359375, 2.591796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 11.0, 9.0, 8.0, 22.0, 21.0, 20.0, 17.0, 27.0, 34.0, 21.0, 33.0, 33.0, 43.0, 34.0, 38.0, 54.0, 52.0, 65.0, 50.0, 42.0, 37.0, 45.0, 29.0, 26.0, 31.0, 40.0, 21.0, 20.0, 16.0, 16.0, 11.0, 19.0, 11.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.9697265625, -1.9087677001953125, -1.847808837890625, -1.7868499755859375, -1.72589111328125, -1.6649322509765625, -1.603973388671875, -1.5430145263671875, -1.4820556640625, -1.4210968017578125, -1.360137939453125, -1.2991790771484375, -1.23822021484375, -1.1772613525390625, -1.116302490234375, -1.0553436279296875, -0.994384765625, -0.9334259033203125, -0.872467041015625, -0.8115081787109375, -0.75054931640625, -0.6895904541015625, -0.628631591796875, -0.5676727294921875, -0.5067138671875, -0.4457550048828125, -0.384796142578125, -0.3238372802734375, -0.26287841796875, -0.2019195556640625, -0.140960693359375, -0.0800018310546875, -0.01904296875, 0.0419158935546875, 0.102874755859375, 0.1638336181640625, 0.22479248046875, 0.2857513427734375, 0.346710205078125, 0.4076690673828125, 0.4686279296875, 0.5295867919921875, 0.590545654296875, 0.6515045166015625, 0.71246337890625, 0.7734222412109375, 0.834381103515625, 0.8953399658203125, 0.956298828125, 1.0172576904296875, 1.078216552734375, 1.1391754150390625, 1.20013427734375, 1.2610931396484375, 1.322052001953125, 1.3830108642578125, 1.4439697265625, 1.5049285888671875, 1.565887451171875, 1.6268463134765625, 1.68780517578125, 1.7487640380859375, 1.809722900390625, 1.8706817626953125, 1.931640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 7.0, 11.0, 14.0, 22.0, 31.0, 38.0, 41.0, 87.0, 130.0, 220.0, 472.0, 918.0, 1923.0, 5113.0, 14841.0, 46004.0, 227565.0, 572259.0, 129576.0, 31642.0, 10671.0, 3842.0, 1552.0, 693.0, 355.0, 182.0, 127.0, 62.0, 44.0, 31.0, 21.0, 24.0, 11.0, 10.0, 2.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.53253173828125, -5.3502197265625, -5.16790771484375, -4.985595703125, -4.80328369140625, -4.6209716796875, -4.43865966796875, -4.25634765625, -4.07403564453125, -3.8917236328125, -3.70941162109375, -3.527099609375, -3.34478759765625, -3.1624755859375, -2.98016357421875, -2.7978515625, -2.61553955078125, -2.4332275390625, -2.25091552734375, -2.068603515625, -1.88629150390625, -1.7039794921875, -1.52166748046875, -1.33935546875, -1.15704345703125, -0.9747314453125, -0.79241943359375, -0.610107421875, -0.42779541015625, -0.2454833984375, -0.06317138671875, 0.119140625, 0.30145263671875, 0.4837646484375, 0.66607666015625, 0.848388671875, 1.03070068359375, 1.2130126953125, 1.39532470703125, 1.57763671875, 1.75994873046875, 1.9422607421875, 2.12457275390625, 2.306884765625, 2.48919677734375, 2.6715087890625, 2.85382080078125, 3.0361328125, 3.21844482421875, 3.4007568359375, 3.58306884765625, 3.765380859375, 3.94769287109375, 4.1300048828125, 4.31231689453125, 4.49462890625, 4.67694091796875, 4.8592529296875, 5.04156494140625, 5.223876953125, 5.40618896484375, 5.5885009765625, 5.77081298828125, 5.953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 12.0, 10.0, 10.0, 8.0, 10.0, 23.0, 17.0, 21.0, 34.0, 30.0, 41.0, 27.0, 38.0, 43.0, 45.0, 55.0, 47.0, 50.0, 41.0, 55.0, 51.0, 49.0, 43.0, 17.0, 34.0, 36.0, 40.0, 20.0, 23.0, 13.0, 13.0, 7.0, 6.0, 6.0, 6.0, 7.0, 1.0, 6.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.74609375, -6.53863525390625, -6.3311767578125, -6.12371826171875, -5.916259765625, -5.70880126953125, -5.5013427734375, -5.29388427734375, -5.08642578125, -4.87896728515625, -4.6715087890625, -4.46405029296875, -4.256591796875, -4.04913330078125, -3.8416748046875, -3.63421630859375, -3.4267578125, -3.21929931640625, -3.0118408203125, -2.80438232421875, -2.596923828125, -2.38946533203125, -2.1820068359375, -1.97454833984375, -1.76708984375, -1.55963134765625, -1.3521728515625, -1.14471435546875, -0.937255859375, -0.72979736328125, -0.5223388671875, -0.31488037109375, -0.107421875, 0.10003662109375, 0.3074951171875, 0.51495361328125, 0.722412109375, 0.92987060546875, 1.1373291015625, 1.34478759765625, 1.55224609375, 1.75970458984375, 1.9671630859375, 2.17462158203125, 2.382080078125, 2.58953857421875, 2.7969970703125, 3.00445556640625, 3.2119140625, 3.41937255859375, 3.6268310546875, 3.83428955078125, 4.041748046875, 4.24920654296875, 4.4566650390625, 4.66412353515625, 4.87158203125, 5.07904052734375, 5.2864990234375, 5.49395751953125, 5.701416015625, 5.90887451171875, 6.1163330078125, 6.32379150390625, 6.53125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 11.0, 13.0, 19.0, 30.0, 44.0, 79.0, 99.0, 200.0, 330.0, 555.0, 1043.0, 1877.0, 3304.0, 5924.0, 11196.0, 22537.0, 55347.0, 165963.0, 385045.0, 250420.0, 82625.0, 30655.0, 14369.0, 7565.0, 4160.0, 2220.0, 1226.0, 704.0, 396.0, 254.0, 136.0, 69.0, 54.0, 30.0, 19.0, 11.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.396270751953125, -1.35601806640625, -1.315765380859375, -1.2755126953125, -1.235260009765625, -1.19500732421875, -1.154754638671875, -1.114501953125, -1.074249267578125, -1.03399658203125, -0.993743896484375, -0.9534912109375, -0.913238525390625, -0.87298583984375, -0.832733154296875, -0.79248046875, -0.752227783203125, -0.71197509765625, -0.671722412109375, -0.6314697265625, -0.591217041015625, -0.55096435546875, -0.510711669921875, -0.470458984375, -0.430206298828125, -0.38995361328125, -0.349700927734375, -0.3094482421875, -0.269195556640625, -0.22894287109375, -0.188690185546875, -0.1484375, -0.108184814453125, -0.06793212890625, -0.027679443359375, 0.0125732421875, 0.052825927734375, 0.09307861328125, 0.133331298828125, 0.173583984375, 0.213836669921875, 0.25408935546875, 0.294342041015625, 0.3345947265625, 0.374847412109375, 0.41510009765625, 0.455352783203125, 0.49560546875, 0.535858154296875, 0.57611083984375, 0.616363525390625, 0.6566162109375, 0.696868896484375, 0.73712158203125, 0.777374267578125, 0.817626953125, 0.857879638671875, 0.89813232421875, 0.938385009765625, 0.9786376953125, 1.018890380859375, 1.05914306640625, 1.099395751953125, 1.1396484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 5.0, 8.0, 10.0, 15.0, 14.0, 34.0, 58.0, 70.0, 121.0, 177.0, 155.0, 110.0, 78.0, 38.0, 25.0, 21.0, 8.0, 11.0, 5.0, 9.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006437301635742188, -0.000625312328338623, -0.0006068944931030273, -0.0005884766578674316, -0.0005700588226318359, -0.0005516409873962402, -0.0005332231521606445, -0.0005148053169250488, -0.0004963874816894531, -0.0004779696464538574, -0.0004595518112182617, -0.000441133975982666, -0.0004227161407470703, -0.0004042983055114746, -0.0003858804702758789, -0.0003674626350402832, -0.0003490447998046875, -0.0003306269645690918, -0.0003122091293334961, -0.0002937912940979004, -0.0002753734588623047, -0.000256955623626709, -0.00023853778839111328, -0.00022011995315551758, -0.00020170211791992188, -0.00018328428268432617, -0.00016486644744873047, -0.00014644861221313477, -0.00012803077697753906, -0.00010961294174194336, -9.119510650634766e-05, -7.277727127075195e-05, -5.435943603515625e-05, -3.594160079956055e-05, -1.7523765563964844e-05, 8.940696716308594e-07, 1.9311904907226562e-05, 3.7729740142822266e-05, 5.614757537841797e-05, 7.456541061401367e-05, 9.298324584960938e-05, 0.00011140108108520508, 0.00012981891632080078, 0.00014823675155639648, 0.0001666545867919922, 0.0001850724220275879, 0.0002034902572631836, 0.0002219080924987793, 0.000240325927734375, 0.0002587437629699707, 0.0002771615982055664, 0.0002955794334411621, 0.0003139972686767578, 0.0003324151039123535, 0.0003508329391479492, 0.0003692507743835449, 0.0003876686096191406, 0.00040608644485473633, 0.00042450428009033203, 0.00044292211532592773, 0.00046133995056152344, 0.00047975778579711914, 0.0004981756210327148, 0.0005165934562683105, 0.0005350112915039062]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 7.0, 16.0, 20.0, 13.0, 36.0, 54.0, 86.0, 122.0, 174.0, 351.0, 564.0, 1249.0, 2739.0, 6444.0, 16787.0, 48440.0, 159019.0, 392907.0, 282476.0, 89576.0, 28612.0, 10572.0, 4303.0, 1966.0, 881.0, 462.0, 234.0, 165.0, 94.0, 52.0, 41.0, 24.0, 21.0, 13.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2744140625, -1.2329864501953125, -1.191558837890625, -1.1501312255859375, -1.10870361328125, -1.0672760009765625, -1.025848388671875, -0.9844207763671875, -0.9429931640625, -0.9015655517578125, -0.860137939453125, -0.8187103271484375, -0.77728271484375, -0.7358551025390625, -0.694427490234375, -0.6529998779296875, -0.611572265625, -0.5701446533203125, -0.528717041015625, -0.4872894287109375, -0.44586181640625, -0.4044342041015625, -0.363006591796875, -0.3215789794921875, -0.2801513671875, -0.2387237548828125, -0.197296142578125, -0.1558685302734375, -0.11444091796875, -0.0730133056640625, -0.031585693359375, 0.0098419189453125, 0.05126953125, 0.0926971435546875, 0.134124755859375, 0.1755523681640625, 0.21697998046875, 0.2584075927734375, 0.299835205078125, 0.3412628173828125, 0.3826904296875, 0.4241180419921875, 0.465545654296875, 0.5069732666015625, 0.54840087890625, 0.5898284912109375, 0.631256103515625, 0.6726837158203125, 0.714111328125, 0.7555389404296875, 0.796966552734375, 0.8383941650390625, 0.87982177734375, 0.9212493896484375, 0.962677001953125, 1.0041046142578125, 1.0455322265625, 1.0869598388671875, 1.128387451171875, 1.1698150634765625, 1.21124267578125, 1.2526702880859375, 1.294097900390625, 1.3355255126953125, 1.376953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 8.0, 5.0, 13.0, 18.0, 18.0, 15.0, 29.0, 35.0, 38.0, 42.0, 43.0, 51.0, 62.0, 60.0, 58.0, 58.0, 56.0, 63.0, 46.0, 48.0, 40.0, 35.0, 24.0, 19.0, 20.0, 9.0, 11.0, 5.0, 9.0, 4.0, 7.0, 5.0, 5.0, 7.0, 2.0, 6.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98046875, -0.9474029541015625, -0.914337158203125, -0.8812713623046875, -0.84820556640625, -0.8151397705078125, -0.782073974609375, -0.7490081787109375, -0.7159423828125, -0.6828765869140625, -0.649810791015625, -0.6167449951171875, -0.58367919921875, -0.5506134033203125, -0.517547607421875, -0.4844818115234375, -0.451416015625, -0.4183502197265625, -0.385284423828125, -0.3522186279296875, -0.31915283203125, -0.2860870361328125, -0.253021240234375, -0.2199554443359375, -0.1868896484375, -0.1538238525390625, -0.120758056640625, -0.0876922607421875, -0.05462646484375, -0.0215606689453125, 0.011505126953125, 0.0445709228515625, 0.07763671875, 0.1107025146484375, 0.143768310546875, 0.1768341064453125, 0.20989990234375, 0.2429656982421875, 0.276031494140625, 0.3090972900390625, 0.3421630859375, 0.3752288818359375, 0.408294677734375, 0.4413604736328125, 0.47442626953125, 0.5074920654296875, 0.540557861328125, 0.5736236572265625, 0.606689453125, 0.6397552490234375, 0.672821044921875, 0.7058868408203125, 0.73895263671875, 0.7720184326171875, 0.805084228515625, 0.8381500244140625, 0.8712158203125, 0.9042816162109375, 0.937347412109375, 0.9704132080078125, 1.00347900390625, 1.0365447998046875, 1.069610595703125, 1.1026763916015625, 1.1357421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 19.0, 27.0, 64.0, 143.0, 148.0, 208.0, 166.0, 111.0, 50.0, 28.0, 22.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.37370491027832, -17.480655670166016, -16.587604522705078, -15.694555282592773, -14.801506042480469, -13.908456802368164, -13.015406608581543, -12.122356414794922, -11.229307174682617, -10.336257934570312, -9.443207740783691, -8.55015754699707, -7.657108306884766, -6.764058589935303, -5.87100887298584, -4.977959156036377, -4.084909439086914, -3.191859722137451, -2.2988100051879883, -1.4057602882385254, -0.5127105712890625, 0.3803391456604004, 1.2733888626098633, 2.166438579559326, 3.059488296508789, 3.952538013458252, 4.845587730407715, 5.738637447357178, 6.631687164306641, 7.5247368812561035, 8.417786598205566, 9.310836791992188, 10.203887939453125, 11.09693717956543, 11.98998737335205, 12.883037567138672, 13.776086807250977, 14.669136047363281, 15.562186241149902, 16.455236434936523, 17.348285675048828, 18.241334915161133, 19.134384155273438, 20.027435302734375, 20.92048454284668, 21.813533782958984, 22.706584930419922, 23.599634170532227, 24.49268341064453, 25.385732650756836, 26.27878189086914, 27.171833038330078, 28.064882278442383, 28.957931518554688, 29.850982666015625, 30.74403190612793, 31.637081146240234, 32.53013229370117, 33.423179626464844, 34.31623077392578, 35.20928192138672, 36.10232925415039, 36.99538040161133, 37.888427734375, 38.78147888183594]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 2.0, 11.0, 9.0, 8.0, 14.0, 14.0, 19.0, 19.0, 35.0, 33.0, 25.0, 34.0, 32.0, 44.0, 42.0, 41.0, 48.0, 46.0, 58.0, 53.0, 41.0, 33.0, 52.0, 35.0, 31.0, 30.0, 19.0, 31.0, 29.0, 13.0, 13.0, 14.0, 10.0, 6.0, 14.0, 7.0, 4.0, 6.0, 2.0, 3.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.734094619750977, -14.256233215332031, -13.778371810913086, -13.30051040649414, -12.822648048400879, -12.344786643981934, -11.866925239562988, -11.389063835144043, -10.911201477050781, -10.433340072631836, -9.95547866821289, -9.477617263793945, -8.999754905700684, -8.521893501281738, -8.044032096862793, -7.566170692443848, -7.088309288024902, -6.610447883605957, -6.1325860023498535, -5.654724597930908, -5.176862716674805, -4.699001312255859, -4.221139907836914, -3.7432782649993896, -3.2654166221618652, -2.787554979324341, -2.3096933364868164, -1.831831932067871, -1.3539702892303467, -0.8761086463928223, -0.39824724197387695, 0.07961440086364746, 0.5574769973754883, 1.0353386402130127, 1.5132001638412476, 1.9910616874694824, 2.468923330307007, 2.9467849731445312, 3.4246463775634766, 3.902508020401001, 4.380369663238525, 4.858231067657471, 5.336092948913574, 5.8139543533325195, 6.291815757751465, 6.769677639007568, 7.247539043426514, 7.725400924682617, 8.203262329101562, 8.681123733520508, 9.158985137939453, 9.636846542358398, 10.11470890045166, 10.592570304870605, 11.07043170928955, 11.548293113708496, 12.026155471801758, 12.504016876220703, 12.981878280639648, 13.459739685058594, 13.937602043151855, 14.4154634475708, 14.893324851989746, 15.371186256408691, 15.849047660827637]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 12.0, 11.0, 27.0, 36.0, 53.0, 76.0, 160.0, 260.0, 499.0, 1069.0, 2450.0, 5838.0, 15448.0, 44820.0, 146965.0, 553301.0, 1681536.0, 1262143.0, 336998.0, 93768.0, 30139.0, 10645.0, 4293.0, 1870.0, 821.0, 419.0, 224.0, 133.0, 89.0, 54.0, 45.0, 27.0, 15.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.392578125, -2.312347412109375, -2.23211669921875, -2.151885986328125, -2.0716552734375, -1.991424560546875, -1.91119384765625, -1.830963134765625, -1.750732421875, -1.670501708984375, -1.59027099609375, -1.510040283203125, -1.4298095703125, -1.349578857421875, -1.26934814453125, -1.189117431640625, -1.10888671875, -1.028656005859375, -0.94842529296875, -0.868194580078125, -0.7879638671875, -0.707733154296875, -0.62750244140625, -0.547271728515625, -0.467041015625, -0.386810302734375, -0.30657958984375, -0.226348876953125, -0.1461181640625, -0.065887451171875, 0.01434326171875, 0.094573974609375, 0.1748046875, 0.255035400390625, 0.33526611328125, 0.415496826171875, 0.4957275390625, 0.575958251953125, 0.65618896484375, 0.736419677734375, 0.816650390625, 0.896881103515625, 0.97711181640625, 1.057342529296875, 1.1375732421875, 1.217803955078125, 1.29803466796875, 1.378265380859375, 1.45849609375, 1.538726806640625, 1.61895751953125, 1.699188232421875, 1.7794189453125, 1.859649658203125, 1.93988037109375, 2.020111083984375, 2.100341796875, 2.180572509765625, 2.26080322265625, 2.341033935546875, 2.4212646484375, 2.501495361328125, 2.58172607421875, 2.661956787109375, 2.7421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 8.0, 10.0, 11.0, 19.0, 24.0, 30.0, 27.0, 40.0, 27.0, 37.0, 39.0, 33.0, 58.0, 54.0, 43.0, 43.0, 44.0, 45.0, 55.0, 46.0, 38.0, 34.0, 43.0, 22.0, 24.0, 28.0, 21.0, 11.0, 8.0, 10.0, 15.0, 8.0, 6.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8388671875, -1.7763824462890625, -1.713897705078125, -1.6514129638671875, -1.58892822265625, -1.5264434814453125, -1.463958740234375, -1.4014739990234375, -1.3389892578125, -1.2765045166015625, -1.214019775390625, -1.1515350341796875, -1.08905029296875, -1.0265655517578125, -0.964080810546875, -0.9015960693359375, -0.839111328125, -0.7766265869140625, -0.714141845703125, -0.6516571044921875, -0.58917236328125, -0.5266876220703125, -0.464202880859375, -0.4017181396484375, -0.3392333984375, -0.2767486572265625, -0.214263916015625, -0.1517791748046875, -0.08929443359375, -0.0268096923828125, 0.035675048828125, 0.0981597900390625, 0.16064453125, 0.2231292724609375, 0.285614013671875, 0.3480987548828125, 0.41058349609375, 0.4730682373046875, 0.535552978515625, 0.5980377197265625, 0.6605224609375, 0.7230072021484375, 0.785491943359375, 0.8479766845703125, 0.91046142578125, 0.9729461669921875, 1.035430908203125, 1.0979156494140625, 1.160400390625, 1.2228851318359375, 1.285369873046875, 1.3478546142578125, 1.41033935546875, 1.4728240966796875, 1.535308837890625, 1.5977935791015625, 1.6602783203125, 1.7227630615234375, 1.785247802734375, 1.8477325439453125, 1.91021728515625, 1.9727020263671875, 2.035186767578125, 2.0976715087890625, 2.16015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 20.0, 33.0, 45.0, 69.0, 120.0, 235.0, 377.0, 792.0, 1653.0, 4090.0, 11856.0, 45446.0, 223942.0, 1697297.0, 1889179.0, 249072.0, 49479.0, 12681.0, 4308.0, 1774.0, 838.0, 399.0, 213.0, 135.0, 85.0, 51.0, 25.0, 18.0, 7.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.671875, -4.52130126953125, -4.3707275390625, -4.22015380859375, -4.069580078125, -3.91900634765625, -3.7684326171875, -3.61785888671875, -3.46728515625, -3.31671142578125, -3.1661376953125, -3.01556396484375, -2.864990234375, -2.71441650390625, -2.5638427734375, -2.41326904296875, -2.2626953125, -2.11212158203125, -1.9615478515625, -1.81097412109375, -1.660400390625, -1.50982666015625, -1.3592529296875, -1.20867919921875, -1.05810546875, -0.90753173828125, -0.7569580078125, -0.60638427734375, -0.455810546875, -0.30523681640625, -0.1546630859375, -0.00408935546875, 0.146484375, 0.29705810546875, 0.4476318359375, 0.59820556640625, 0.748779296875, 0.89935302734375, 1.0499267578125, 1.20050048828125, 1.35107421875, 1.50164794921875, 1.6522216796875, 1.80279541015625, 1.953369140625, 2.10394287109375, 2.2545166015625, 2.40509033203125, 2.5556640625, 2.70623779296875, 2.8568115234375, 3.00738525390625, 3.157958984375, 3.30853271484375, 3.4591064453125, 3.60968017578125, 3.76025390625, 3.91082763671875, 4.0614013671875, 4.21197509765625, 4.362548828125, 4.51312255859375, 4.6636962890625, 4.81427001953125, 4.96484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 17.0, 12.0, 23.0, 28.0, 51.0, 72.0, 74.0, 109.0, 169.0, 230.0, 306.0, 510.0, 629.0, 522.0, 408.0, 245.0, 185.0, 128.0, 89.0, 68.0, 38.0, 31.0, 33.0, 23.0, 16.0, 17.0, 5.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.113861083984375, -2.97576904296875, -2.837677001953125, -2.6995849609375, -2.561492919921875, -2.42340087890625, -2.285308837890625, -2.147216796875, -2.009124755859375, -1.87103271484375, -1.732940673828125, -1.5948486328125, -1.456756591796875, -1.31866455078125, -1.180572509765625, -1.04248046875, -0.904388427734375, -0.76629638671875, -0.628204345703125, -0.4901123046875, -0.352020263671875, -0.21392822265625, -0.075836181640625, 0.062255859375, 0.200347900390625, 0.33843994140625, 0.476531982421875, 0.6146240234375, 0.752716064453125, 0.89080810546875, 1.028900146484375, 1.1669921875, 1.305084228515625, 1.44317626953125, 1.581268310546875, 1.7193603515625, 1.857452392578125, 1.99554443359375, 2.133636474609375, 2.271728515625, 2.409820556640625, 2.54791259765625, 2.686004638671875, 2.8240966796875, 2.962188720703125, 3.10028076171875, 3.238372802734375, 3.37646484375, 3.514556884765625, 3.65264892578125, 3.790740966796875, 3.9288330078125, 4.066925048828125, 4.20501708984375, 4.343109130859375, 4.481201171875, 4.619293212890625, 4.75738525390625, 4.895477294921875, 5.0335693359375, 5.171661376953125, 5.30975341796875, 5.447845458984375, 5.5859375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 6.0, 9.0, 35.0, 90.0, 217.0, 293.0, 215.0, 95.0, 26.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.83698654174805, -57.022987365722656, -55.208984375, -53.39498519897461, -51.58098220825195, -49.76698303222656, -47.952980041503906, -46.138980865478516, -44.324981689453125, -42.510982513427734, -40.69697952270508, -38.88298034667969, -37.06897735595703, -35.25497817993164, -33.44097900390625, -31.626976013183594, -29.812973022460938, -27.998971939086914, -26.18497085571289, -24.3709716796875, -22.556968688964844, -20.742969512939453, -18.92896842956543, -17.114967346191406, -15.300966262817383, -13.48696517944336, -11.672964096069336, -9.858963966369629, -8.044962882995605, -6.230961799621582, -4.416961669921875, -2.6029605865478516, -0.7889633178710938, 1.0250375270843506, 2.839038372039795, 4.65303897857666, 6.467040061950684, 8.281041145324707, 10.095041275024414, 11.909042358398438, 13.723043441772461, 15.537044525146484, 17.351045608520508, 19.16504669189453, 20.979045867919922, 22.793048858642578, 24.60704803466797, 26.421049118041992, 28.235050201416016, 30.04905128479004, 31.863052368164062, 33.67705154418945, 35.49105453491211, 37.3050537109375, 39.119056701660156, 40.93305587768555, 42.74705505371094, 44.56105422973633, 46.375057220458984, 48.189056396484375, 50.00305938720703, 51.81705856323242, 53.63105773925781, 55.44506072998047, 57.259063720703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 10.0, 8.0, 8.0, 10.0, 17.0, 9.0, 14.0, 20.0, 28.0, 20.0, 32.0, 25.0, 31.0, 38.0, 26.0, 28.0, 37.0, 40.0, 36.0, 35.0, 41.0, 31.0, 45.0, 33.0, 43.0, 54.0, 43.0, 36.0, 26.0, 25.0, 28.0, 14.0, 17.0, 15.0, 17.0, 13.0, 10.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.789836883544922, -12.391395568847656, -11.99295425415039, -11.594512939453125, -11.19607162475586, -10.797630310058594, -10.399188995361328, -10.000747680664062, -9.602306365966797, -9.203865051269531, -8.805423736572266, -8.406982421875, -8.008541107177734, -7.610099792480469, -7.211658477783203, -6.8132171630859375, -6.41477632522583, -6.0163350105285645, -5.617893695831299, -5.219452381134033, -4.821011066436768, -4.422569751739502, -4.0241289138793945, -3.62568736076355, -3.227246046066284, -2.8288047313690186, -2.430363416671753, -2.0319223403930664, -1.6334809064865112, -1.2350395917892456, -0.8365983963012695, -0.4381570816040039, -0.03971576690673828, 0.35872551798820496, 0.7571668028831482, 1.155608057975769, 1.5540493726730347, 1.9524906873703003, 2.3509318828582764, 2.749373197555542, 3.1478145122528076, 3.5462558269500732, 3.944697141647339, 4.343138217926025, 4.741579532623291, 5.140020847320557, 5.538462162017822, 5.936903476715088, 6.3353447914123535, 6.733786106109619, 7.132227420806885, 7.53066873550415, 7.929110050201416, 8.327550888061523, 8.725992202758789, 9.124433517456055, 9.52287483215332, 9.921316146850586, 10.319757461547852, 10.718198776245117, 11.116640090942383, 11.515081405639648, 11.913522720336914, 12.31196403503418, 12.710405349731445]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 16.0, 16.0, 24.0, 38.0, 42.0, 86.0, 131.0, 183.0, 339.0, 518.0, 948.0, 1668.0, 3014.0, 5514.0, 10737.0, 21929.0, 45424.0, 90352.0, 159244.0, 216539.0, 204971.0, 137976.0, 74815.0, 36580.0, 17857.0, 8841.0, 4716.0, 2535.0, 1393.0, 807.0, 482.0, 320.0, 148.0, 134.0, 71.0, 46.0, 29.0, 13.0, 16.0, 8.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.9130859375, -1.8548583984375, -1.796630859375, -1.7384033203125, -1.68017578125, -1.6219482421875, -1.563720703125, -1.5054931640625, -1.447265625, -1.3890380859375, -1.330810546875, -1.2725830078125, -1.21435546875, -1.1561279296875, -1.097900390625, -1.0396728515625, -0.9814453125, -0.9232177734375, -0.864990234375, -0.8067626953125, -0.74853515625, -0.6903076171875, -0.632080078125, -0.5738525390625, -0.515625, -0.4573974609375, -0.399169921875, -0.3409423828125, -0.28271484375, -0.2244873046875, -0.166259765625, -0.1080322265625, -0.0498046875, 0.0084228515625, 0.066650390625, 0.1248779296875, 0.18310546875, 0.2413330078125, 0.299560546875, 0.3577880859375, 0.416015625, 0.4742431640625, 0.532470703125, 0.5906982421875, 0.64892578125, 0.7071533203125, 0.765380859375, 0.8236083984375, 0.8818359375, 0.9400634765625, 0.998291015625, 1.0565185546875, 1.11474609375, 1.1729736328125, 1.231201171875, 1.2894287109375, 1.34765625, 1.4058837890625, 1.464111328125, 1.5223388671875, 1.58056640625, 1.6387939453125, 1.697021484375, 1.7552490234375, 1.8134765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 11.0, 9.0, 8.0, 19.0, 13.0, 12.0, 28.0, 40.0, 30.0, 42.0, 39.0, 54.0, 47.0, 61.0, 55.0, 62.0, 59.0, 34.0, 59.0, 44.0, 42.0, 39.0, 42.0, 35.0, 20.0, 16.0, 30.0, 12.0, 8.0, 13.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.473846435546875, -1.40277099609375, -1.331695556640625, -1.2606201171875, -1.189544677734375, -1.11846923828125, -1.047393798828125, -0.976318359375, -0.905242919921875, -0.83416748046875, -0.763092041015625, -0.6920166015625, -0.620941162109375, -0.54986572265625, -0.478790283203125, -0.40771484375, -0.336639404296875, -0.26556396484375, -0.194488525390625, -0.1234130859375, -0.052337646484375, 0.01873779296875, 0.089813232421875, 0.160888671875, 0.231964111328125, 0.30303955078125, 0.374114990234375, 0.4451904296875, 0.516265869140625, 0.58734130859375, 0.658416748046875, 0.7294921875, 0.800567626953125, 0.87164306640625, 0.942718505859375, 1.0137939453125, 1.084869384765625, 1.15594482421875, 1.227020263671875, 1.298095703125, 1.369171142578125, 1.44024658203125, 1.511322021484375, 1.5823974609375, 1.653472900390625, 1.72454833984375, 1.795623779296875, 1.86669921875, 1.937774658203125, 2.00885009765625, 2.079925537109375, 2.1510009765625, 2.222076416015625, 2.29315185546875, 2.364227294921875, 2.435302734375, 2.506378173828125, 2.57745361328125, 2.648529052734375, 2.7196044921875, 2.790679931640625, 2.86175537109375, 2.932830810546875, 3.00390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 13.0, 23.0, 23.0, 25.0, 61.0, 110.0, 148.0, 233.0, 405.0, 713.0, 1476.0, 2910.0, 6636.0, 17009.0, 47724.0, 131961.0, 277248.0, 302332.0, 162466.0, 60138.0, 21452.0, 8116.0, 3505.0, 1644.0, 884.0, 473.0, 285.0, 171.0, 115.0, 78.0, 49.0, 38.0, 29.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.27545166015625, -2.1915283203125, -2.10760498046875, -2.023681640625, -1.93975830078125, -1.8558349609375, -1.77191162109375, -1.68798828125, -1.60406494140625, -1.5201416015625, -1.43621826171875, -1.352294921875, -1.26837158203125, -1.1844482421875, -1.10052490234375, -1.0166015625, -0.93267822265625, -0.8487548828125, -0.76483154296875, -0.680908203125, -0.59698486328125, -0.5130615234375, -0.42913818359375, -0.34521484375, -0.26129150390625, -0.1773681640625, -0.09344482421875, -0.009521484375, 0.07440185546875, 0.1583251953125, 0.24224853515625, 0.326171875, 0.41009521484375, 0.4940185546875, 0.57794189453125, 0.661865234375, 0.74578857421875, 0.8297119140625, 0.91363525390625, 0.99755859375, 1.08148193359375, 1.1654052734375, 1.24932861328125, 1.333251953125, 1.41717529296875, 1.5010986328125, 1.58502197265625, 1.6689453125, 1.75286865234375, 1.8367919921875, 1.92071533203125, 2.004638671875, 2.08856201171875, 2.1724853515625, 2.25640869140625, 2.34033203125, 2.42425537109375, 2.5081787109375, 2.59210205078125, 2.676025390625, 2.75994873046875, 2.8438720703125, 2.92779541015625, 3.01171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 5.0, 5.0, 15.0, 10.0, 12.0, 25.0, 18.0, 20.0, 37.0, 38.0, 44.0, 46.0, 56.0, 48.0, 48.0, 43.0, 53.0, 51.0, 41.0, 41.0, 52.0, 53.0, 39.0, 40.0, 34.0, 26.0, 25.0, 23.0, 15.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.5067138671875, -6.306396484375, -6.1060791015625, -5.90576171875, -5.7054443359375, -5.505126953125, -5.3048095703125, -5.1044921875, -4.9041748046875, -4.703857421875, -4.5035400390625, -4.30322265625, -4.1029052734375, -3.902587890625, -3.7022705078125, -3.501953125, -3.3016357421875, -3.101318359375, -2.9010009765625, -2.70068359375, -2.5003662109375, -2.300048828125, -2.0997314453125, -1.8994140625, -1.6990966796875, -1.498779296875, -1.2984619140625, -1.09814453125, -0.8978271484375, -0.697509765625, -0.4971923828125, -0.296875, -0.0965576171875, 0.103759765625, 0.3040771484375, 0.50439453125, 0.7047119140625, 0.905029296875, 1.1053466796875, 1.3056640625, 1.5059814453125, 1.706298828125, 1.9066162109375, 2.10693359375, 2.3072509765625, 2.507568359375, 2.7078857421875, 2.908203125, 3.1085205078125, 3.308837890625, 3.5091552734375, 3.70947265625, 3.9097900390625, 4.110107421875, 4.3104248046875, 4.5107421875, 4.7110595703125, 4.911376953125, 5.1116943359375, 5.31201171875, 5.5123291015625, 5.712646484375, 5.9129638671875, 6.11328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 18.0, 11.0, 14.0, 40.0, 67.0, 98.0, 153.0, 233.0, 443.0, 777.0, 1380.0, 2783.0, 5358.0, 10898.0, 21730.0, 44300.0, 88553.0, 158231.0, 221579.0, 208569.0, 137132.0, 73341.0, 36640.0, 17853.0, 8756.0, 4414.0, 2307.0, 1198.0, 662.0, 403.0, 204.0, 122.0, 96.0, 57.0, 31.0, 31.0, 16.0, 14.0, 11.0, 10.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8592605590820312, -0.8322906494140625, -0.8053207397460938, -0.778350830078125, -0.7513809204101562, -0.7244110107421875, -0.6974411010742188, -0.67047119140625, -0.6435012817382812, -0.6165313720703125, -0.5895614624023438, -0.562591552734375, -0.5356216430664062, -0.5086517333984375, -0.48168182373046875, -0.4547119140625, -0.42774200439453125, -0.4007720947265625, -0.37380218505859375, -0.346832275390625, -0.31986236572265625, -0.2928924560546875, -0.26592254638671875, -0.23895263671875, -0.21198272705078125, -0.1850128173828125, -0.15804290771484375, -0.131072998046875, -0.10410308837890625, -0.0771331787109375, -0.05016326904296875, -0.023193359375, 0.00377655029296875, 0.0307464599609375, 0.05771636962890625, 0.084686279296875, 0.11165618896484375, 0.1386260986328125, 0.16559600830078125, 0.19256591796875, 0.21953582763671875, 0.2465057373046875, 0.27347564697265625, 0.300445556640625, 0.32741546630859375, 0.3543853759765625, 0.38135528564453125, 0.4083251953125, 0.43529510498046875, 0.4622650146484375, 0.48923492431640625, 0.516204833984375, 0.5431747436523438, 0.5701446533203125, 0.5971145629882812, 0.62408447265625, 0.6510543823242188, 0.6780242919921875, 0.7049942016601562, 0.731964111328125, 0.7589340209960938, 0.7859039306640625, 0.8128738403320312, 0.83984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 7.0, 5.0, 4.0, 8.0, 8.0, 11.0, 11.0, 14.0, 18.0, 26.0, 23.0, 26.0, 37.0, 36.0, 64.0, 53.0, 68.0, 72.0, 70.0, 50.0, 59.0, 64.0, 46.0, 42.0, 26.0, 27.0, 26.0, 15.0, 16.0, 13.0, 12.0, 8.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002887248992919922, -0.00028036534786224365, -0.0002720057964324951, -0.0002636462450027466, -0.00025528669357299805, -0.0002469271421432495, -0.00023856759071350098, -0.00023020803928375244, -0.0002218484878540039, -0.00021348893642425537, -0.00020512938499450684, -0.0001967698335647583, -0.00018841028213500977, -0.00018005073070526123, -0.0001716911792755127, -0.00016333162784576416, -0.00015497207641601562, -0.0001466125249862671, -0.00013825297355651855, -0.00012989342212677002, -0.00012153387069702148, -0.00011317431926727295, -0.00010481476783752441, -9.645521640777588e-05, -8.809566497802734e-05, -7.973611354827881e-05, -7.137656211853027e-05, -6.301701068878174e-05, -5.46574592590332e-05, -4.629790782928467e-05, -3.793835639953613e-05, -2.9578804969787598e-05, -2.1219253540039062e-05, -1.2859702110290527e-05, -4.500150680541992e-06, 3.859400749206543e-06, 1.2218952178955078e-05, 2.0578503608703613e-05, 2.893805503845215e-05, 3.7297606468200684e-05, 4.565715789794922e-05, 5.4016709327697754e-05, 6.237626075744629e-05, 7.073581218719482e-05, 7.909536361694336e-05, 8.74549150466919e-05, 9.581446647644043e-05, 0.00010417401790618896, 0.0001125335693359375, 0.00012089312076568604, 0.00012925267219543457, 0.0001376122236251831, 0.00014597177505493164, 0.00015433132648468018, 0.0001626908779144287, 0.00017105042934417725, 0.00017940998077392578, 0.00018776953220367432, 0.00019612908363342285, 0.0002044886350631714, 0.00021284818649291992, 0.00022120773792266846, 0.000229567289352417, 0.00023792684078216553, 0.00024628639221191406]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 10.0, 13.0, 18.0, 23.0, 67.0, 78.0, 141.0, 277.0, 482.0, 937.0, 1985.0, 4340.0, 10329.0, 24901.0, 61953.0, 139045.0, 239127.0, 258411.0, 169475.0, 79592.0, 33146.0, 13368.0, 5693.0, 2570.0, 1218.0, 599.0, 299.0, 173.0, 119.0, 53.0, 37.0, 33.0, 8.0, 10.0, 9.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91650390625, -0.8850631713867188, -0.8536224365234375, -0.8221817016601562, -0.790740966796875, -0.7593002319335938, -0.7278594970703125, -0.6964187622070312, -0.66497802734375, -0.6335372924804688, -0.6020965576171875, -0.5706558227539062, -0.539215087890625, -0.5077743530273438, -0.4763336181640625, -0.44489288330078125, -0.4134521484375, -0.38201141357421875, -0.3505706787109375, -0.31912994384765625, -0.287689208984375, -0.25624847412109375, -0.2248077392578125, -0.19336700439453125, -0.16192626953125, -0.13048553466796875, -0.0990447998046875, -0.06760406494140625, -0.036163330078125, -0.00472259521484375, 0.0267181396484375, 0.05815887451171875, 0.089599609375, 0.12104034423828125, 0.1524810791015625, 0.18392181396484375, 0.215362548828125, 0.24680328369140625, 0.2782440185546875, 0.30968475341796875, 0.34112548828125, 0.37256622314453125, 0.4040069580078125, 0.43544769287109375, 0.466888427734375, 0.49832916259765625, 0.5297698974609375, 0.5612106323242188, 0.5926513671875, 0.6240921020507812, 0.6555328369140625, 0.6869735717773438, 0.718414306640625, 0.7498550415039062, 0.7812957763671875, 0.8127365112304688, 0.84417724609375, 0.8756179809570312, 0.9070587158203125, 0.9384994506835938, 0.969940185546875, 1.0013809204101562, 1.0328216552734375, 1.0642623901367188, 1.095703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 10.0, 14.0, 11.0, 17.0, 25.0, 21.0, 23.0, 18.0, 31.0, 36.0, 40.0, 55.0, 42.0, 71.0, 50.0, 63.0, 55.0, 45.0, 56.0, 51.0, 30.0, 31.0, 37.0, 27.0, 30.0, 25.0, 18.0, 19.0, 8.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.1287155151367188, -1.0953216552734375, -1.0619277954101562, -1.028533935546875, -0.9951400756835938, -0.9617462158203125, -0.9283523559570312, -0.89495849609375, -0.8615646362304688, -0.8281707763671875, -0.7947769165039062, -0.761383056640625, -0.7279891967773438, -0.6945953369140625, -0.6612014770507812, -0.6278076171875, -0.5944137573242188, -0.5610198974609375, -0.5276260375976562, -0.494232177734375, -0.46083831787109375, -0.4274444580078125, -0.39405059814453125, -0.36065673828125, -0.32726287841796875, -0.2938690185546875, -0.26047515869140625, -0.227081298828125, -0.19368743896484375, -0.1602935791015625, -0.12689971923828125, -0.093505859375, -0.06011199951171875, -0.0267181396484375, 0.00667572021484375, 0.040069580078125, 0.07346343994140625, 0.1068572998046875, 0.14025115966796875, 0.17364501953125, 0.20703887939453125, 0.2404327392578125, 0.27382659912109375, 0.307220458984375, 0.34061431884765625, 0.3740081787109375, 0.40740203857421875, 0.4407958984375, 0.47418975830078125, 0.5075836181640625, 0.5409774780273438, 0.574371337890625, 0.6077651977539062, 0.6411590576171875, 0.6745529174804688, 0.70794677734375, 0.7413406372070312, 0.7747344970703125, 0.8081283569335938, 0.841522216796875, 0.8749160766601562, 0.9083099365234375, 0.9417037963867188, 0.97509765625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 13.0, 20.0, 86.0, 174.0, 259.0, 200.0, 133.0, 71.0, 22.0, 7.0, 2.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.65446472167969, -31.742692947387695, -30.830921173095703, -29.91914939880371, -29.00737762451172, -28.09560775756836, -27.183834075927734, -26.272064208984375, -25.360292434692383, -24.44852066040039, -23.5367488861084, -22.624977111816406, -21.713205337524414, -20.801433563232422, -19.889663696289062, -18.97789192199707, -18.066120147705078, -17.154348373413086, -16.242576599121094, -15.330804824829102, -14.419034004211426, -13.507262229919434, -12.595490455627441, -11.683719635009766, -10.77194595336914, -9.860174179077148, -8.948402404785156, -8.036630630493164, -7.124859809875488, -6.213088035583496, -5.301316261291504, -4.38954496383667, -3.477773666381836, -2.566002130508423, -1.6542304754257202, -0.7424588203430176, 0.1693127155303955, 1.0810842514038086, 1.9928560256958008, 2.9046273231506348, 3.816399097442627, 4.728170871734619, 5.639942169189453, 6.551713943481445, 7.4634857177734375, 8.37525749206543, 9.287029266357422, 10.198800086975098, 11.11057186126709, 12.022343635559082, 12.934115409851074, 13.84588623046875, 14.757658004760742, 15.669429779052734, 16.581201553344727, 17.49297332763672, 18.40474510192871, 19.316516876220703, 20.228288650512695, 21.140060424804688, 22.05183219909668, 22.963603973388672, 23.87537384033203, 24.787145614624023, 25.698917388916016]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 10.0, 11.0, 17.0, 19.0, 16.0, 18.0, 13.0, 15.0, 26.0, 27.0, 26.0, 43.0, 37.0, 46.0, 36.0, 41.0, 39.0, 45.0, 50.0, 37.0, 40.0, 31.0, 38.0, 35.0, 38.0, 27.0, 30.0, 27.0, 24.0, 19.0, 25.0, 12.0, 8.0, 13.0, 8.0, 12.0, 10.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.338685989379883, -14.875646591186523, -14.41260814666748, -13.949569702148438, -13.486530303955078, -13.023490905761719, -12.560452461242676, -12.097414016723633, -11.634374618530273, -11.171335220336914, -10.708296775817871, -10.245258331298828, -9.782218933105469, -9.31917953491211, -8.856141090393066, -8.393102645874023, -7.930063247680664, -7.467024326324463, -7.003985404968262, -6.5409464836120605, -6.077907562255859, -5.614868640899658, -5.151829719543457, -4.688790798187256, -4.225751876831055, -3.7627129554748535, -3.2996740341186523, -2.836635112762451, -2.37359619140625, -1.9105572700500488, -1.4475183486938477, -0.9844794273376465, -0.5214405059814453, -0.05840158462524414, 0.40463733673095703, 0.8676762580871582, 1.3307151794433594, 1.7937541007995605, 2.2567930221557617, 2.719831943511963, 3.182870864868164, 3.6459097862243652, 4.108948707580566, 4.571987628936768, 5.035026550292969, 5.49806547164917, 5.961104393005371, 6.424143314361572, 6.887182235717773, 7.350221157073975, 7.813260078430176, 8.276298522949219, 8.739337921142578, 9.202377319335938, 9.66541576385498, 10.128454208374023, 10.591493606567383, 11.054533004760742, 11.517571449279785, 11.980609893798828, 12.443649291992188, 12.906688690185547, 13.36972713470459, 13.832765579223633, 14.295804977416992]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 16.0, 31.0, 32.0, 99.0, 169.0, 353.0, 661.0, 1421.0, 3081.0, 7308.0, 19262.0, 61370.0, 248718.0, 1055858.0, 1922754.0, 669899.0, 143621.0, 37275.0, 12338.0, 5030.0, 2273.0, 1148.0, 635.0, 335.0, 190.0, 118.0, 82.0, 55.0, 39.0, 18.0, 21.0, 24.0, 12.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.089874267578125, -2.00396728515625, -1.918060302734375, -1.8321533203125, -1.746246337890625, -1.66033935546875, -1.574432373046875, -1.488525390625, -1.402618408203125, -1.31671142578125, -1.230804443359375, -1.1448974609375, -1.058990478515625, -0.97308349609375, -0.887176513671875, -0.80126953125, -0.715362548828125, -0.62945556640625, -0.543548583984375, -0.4576416015625, -0.371734619140625, -0.28582763671875, -0.199920654296875, -0.114013671875, -0.028106689453125, 0.05780029296875, 0.143707275390625, 0.2296142578125, 0.315521240234375, 0.40142822265625, 0.487335205078125, 0.5732421875, 0.659149169921875, 0.74505615234375, 0.830963134765625, 0.9168701171875, 1.002777099609375, 1.08868408203125, 1.174591064453125, 1.260498046875, 1.346405029296875, 1.43231201171875, 1.518218994140625, 1.6041259765625, 1.690032958984375, 1.77593994140625, 1.861846923828125, 1.94775390625, 2.033660888671875, 2.11956787109375, 2.205474853515625, 2.2913818359375, 2.377288818359375, 2.46319580078125, 2.549102783203125, 2.635009765625, 2.720916748046875, 2.80682373046875, 2.892730712890625, 2.9786376953125, 3.064544677734375, 3.15045166015625, 3.236358642578125, 3.322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 9.0, 9.0, 12.0, 16.0, 21.0, 20.0, 20.0, 24.0, 30.0, 41.0, 42.0, 40.0, 50.0, 49.0, 56.0, 38.0, 53.0, 49.0, 44.0, 44.0, 42.0, 40.0, 39.0, 29.0, 29.0, 24.0, 30.0, 19.0, 17.0, 12.0, 12.0, 7.0, 10.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.23046875, -2.157379150390625, -2.08428955078125, -2.011199951171875, -1.9381103515625, -1.865020751953125, -1.79193115234375, -1.718841552734375, -1.645751953125, -1.572662353515625, -1.49957275390625, -1.426483154296875, -1.3533935546875, -1.280303955078125, -1.20721435546875, -1.134124755859375, -1.06103515625, -0.987945556640625, -0.91485595703125, -0.841766357421875, -0.7686767578125, -0.695587158203125, -0.62249755859375, -0.549407958984375, -0.476318359375, -0.403228759765625, -0.33013916015625, -0.257049560546875, -0.1839599609375, -0.110870361328125, -0.03778076171875, 0.035308837890625, 0.1083984375, 0.181488037109375, 0.25457763671875, 0.327667236328125, 0.4007568359375, 0.473846435546875, 0.54693603515625, 0.620025634765625, 0.693115234375, 0.766204833984375, 0.83929443359375, 0.912384033203125, 0.9854736328125, 1.058563232421875, 1.13165283203125, 1.204742431640625, 1.27783203125, 1.350921630859375, 1.42401123046875, 1.497100830078125, 1.5701904296875, 1.643280029296875, 1.71636962890625, 1.789459228515625, 1.862548828125, 1.935638427734375, 2.00872802734375, 2.081817626953125, 2.1549072265625, 2.227996826171875, 2.30108642578125, 2.374176025390625, 2.447265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 10.0, 10.0, 8.0, 23.0, 33.0, 49.0, 76.0, 122.0, 214.0, 362.0, 608.0, 1239.0, 2830.0, 7202.0, 21154.0, 75416.0, 347314.0, 2280736.0, 1199859.0, 188520.0, 45679.0, 13686.0, 4922.0, 2005.0, 984.0, 500.0, 266.0, 165.0, 104.0, 57.0, 40.0, 27.0, 22.0, 7.0, 9.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.56640625, -3.44677734375, -3.3271484375, -3.20751953125, -3.087890625, -2.96826171875, -2.8486328125, -2.72900390625, -2.609375, -2.48974609375, -2.3701171875, -2.25048828125, -2.130859375, -2.01123046875, -1.8916015625, -1.77197265625, -1.65234375, -1.53271484375, -1.4130859375, -1.29345703125, -1.173828125, -1.05419921875, -0.9345703125, -0.81494140625, -0.6953125, -0.57568359375, -0.4560546875, -0.33642578125, -0.216796875, -0.09716796875, 0.0224609375, 0.14208984375, 0.26171875, 0.38134765625, 0.5009765625, 0.62060546875, 0.740234375, 0.85986328125, 0.9794921875, 1.09912109375, 1.21875, 1.33837890625, 1.4580078125, 1.57763671875, 1.697265625, 1.81689453125, 1.9365234375, 2.05615234375, 2.17578125, 2.29541015625, 2.4150390625, 2.53466796875, 2.654296875, 2.77392578125, 2.8935546875, 3.01318359375, 3.1328125, 3.25244140625, 3.3720703125, 3.49169921875, 3.611328125, 3.73095703125, 3.8505859375, 3.97021484375, 4.08984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 5.0, 13.0, 11.0, 26.0, 22.0, 43.0, 47.0, 47.0, 96.0, 141.0, 225.0, 386.0, 633.0, 790.0, 569.0, 354.0, 206.0, 155.0, 96.0, 58.0, 32.0, 29.0, 25.0, 14.0, 13.0, 9.0, 12.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.07171630859375, -3.9285888671875, -3.78546142578125, -3.642333984375, -3.49920654296875, -3.3560791015625, -3.21295166015625, -3.06982421875, -2.92669677734375, -2.7835693359375, -2.64044189453125, -2.497314453125, -2.35418701171875, -2.2110595703125, -2.06793212890625, -1.9248046875, -1.78167724609375, -1.6385498046875, -1.49542236328125, -1.352294921875, -1.20916748046875, -1.0660400390625, -0.92291259765625, -0.77978515625, -0.63665771484375, -0.4935302734375, -0.35040283203125, -0.207275390625, -0.06414794921875, 0.0789794921875, 0.22210693359375, 0.365234375, 0.50836181640625, 0.6514892578125, 0.79461669921875, 0.937744140625, 1.08087158203125, 1.2239990234375, 1.36712646484375, 1.51025390625, 1.65338134765625, 1.7965087890625, 1.93963623046875, 2.082763671875, 2.22589111328125, 2.3690185546875, 2.51214599609375, 2.6552734375, 2.79840087890625, 2.9415283203125, 3.08465576171875, 3.227783203125, 3.37091064453125, 3.5140380859375, 3.65716552734375, 3.80029296875, 3.94342041015625, 4.0865478515625, 4.22967529296875, 4.372802734375, 4.51593017578125, 4.6590576171875, 4.80218505859375, 4.9453125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 32.0, 60.0, 166.0, 225.0, 250.0, 151.0, 66.0, 26.0, 10.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.8653564453125, -54.594322204589844, -53.32328796386719, -52.0522575378418, -50.78122329711914, -49.510189056396484, -48.239158630371094, -46.96812438964844, -45.69709014892578, -44.426055908203125, -43.15502166748047, -41.88399124145508, -40.61295700073242, -39.341922760009766, -38.070892333984375, -36.79985809326172, -35.52882385253906, -34.257789611816406, -32.98675537109375, -31.71572494506836, -30.444690704345703, -29.173656463623047, -27.902624130249023, -26.631591796875, -25.360557556152344, -24.089523315429688, -22.818490982055664, -21.54745864868164, -20.276424407958984, -19.005390167236328, -17.734357833862305, -16.46332550048828, -15.192291259765625, -13.921257972717285, -12.650224685668945, -11.379191398620605, -10.108158111572266, -8.837124824523926, -7.566091537475586, -6.295058250427246, -5.024024963378906, -3.7529916763305664, -2.4819583892822266, -1.2109251022338867, 0.060108184814453125, 1.331141471862793, 2.602174758911133, 3.8732080459594727, 5.1442413330078125, 6.415274620056152, 7.686307907104492, 8.957341194152832, 10.228374481201172, 11.499407768249512, 12.770441055297852, 14.041474342346191, 15.312507629394531, 16.583541870117188, 17.85457420349121, 19.125606536865234, 20.39664077758789, 21.667675018310547, 22.93870735168457, 24.209739685058594, 25.48077392578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 18.0, 11.0, 9.0, 12.0, 12.0, 19.0, 16.0, 16.0, 21.0, 17.0, 26.0, 34.0, 32.0, 35.0, 37.0, 33.0, 40.0, 40.0, 41.0, 32.0, 40.0, 39.0, 33.0, 33.0, 31.0, 35.0, 35.0, 26.0, 20.0, 21.0, 26.0, 30.0, 17.0, 16.0, 11.0, 11.0, 13.0, 11.0, 6.0, 6.0, 6.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-10.014322280883789, -9.704379081726074, -9.39443588256836, -9.084493637084961, -8.774550437927246, -8.464607238769531, -8.154664039611816, -7.844720840454102, -7.534777641296387, -7.224834442138672, -6.914891719818115, -6.6049485206604, -6.2950053215026855, -5.985062599182129, -5.675119400024414, -5.365176200866699, -5.055233478546143, -4.745290279388428, -4.435347557067871, -4.125404357910156, -3.8154611587524414, -3.5055181980133057, -3.19557523727417, -2.885632038116455, -2.5756890773773193, -2.2657461166381836, -1.9558029174804688, -1.645859956741333, -1.3359168767929077, -1.0259737968444824, -0.7160308361053467, -0.40608763694763184, -0.0961446762084961, 0.2137983739376068, 0.5237414240837097, 0.8336844444274902, 1.1436275243759155, 1.4535706043243408, 1.7635135650634766, 2.0734567642211914, 2.383399724960327, 2.693342685699463, 3.0032858848571777, 3.3132288455963135, 3.623171806335449, 3.933115005493164, 4.243058204650879, 4.553001403808594, 4.86294412612915, 5.172887325286865, 5.482830047607422, 5.792773246765137, 6.102716445922852, 6.412659645080566, 6.722602367401123, 7.032545566558838, 7.3424882888793945, 7.652431488037109, 7.962374210357666, 8.272317886352539, 8.582260131835938, 8.892203330993652, 9.202146530151367, 9.512089729309082, 9.822032928466797]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 3.0, 10.0, 14.0, 9.0, 23.0, 30.0, 47.0, 71.0, 99.0, 211.0, 365.0, 599.0, 1225.0, 2607.0, 5247.0, 11296.0, 27321.0, 89113.0, 300838.0, 393388.0, 145824.0, 41225.0, 15106.0, 6833.0, 3376.0, 1672.0, 895.0, 476.0, 245.0, 154.0, 80.0, 51.0, 36.0, 17.0, 19.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.712890625, -3.593841552734375, -3.47479248046875, -3.355743408203125, -3.2366943359375, -3.117645263671875, -2.99859619140625, -2.879547119140625, -2.760498046875, -2.641448974609375, -2.52239990234375, -2.403350830078125, -2.2843017578125, -2.165252685546875, -2.04620361328125, -1.927154541015625, -1.80810546875, -1.689056396484375, -1.57000732421875, -1.450958251953125, -1.3319091796875, -1.212860107421875, -1.09381103515625, -0.974761962890625, -0.855712890625, -0.736663818359375, -0.61761474609375, -0.498565673828125, -0.3795166015625, -0.260467529296875, -0.14141845703125, -0.022369384765625, 0.0966796875, 0.215728759765625, 0.33477783203125, 0.453826904296875, 0.5728759765625, 0.691925048828125, 0.81097412109375, 0.930023193359375, 1.049072265625, 1.168121337890625, 1.28717041015625, 1.406219482421875, 1.5252685546875, 1.644317626953125, 1.76336669921875, 1.882415771484375, 2.00146484375, 2.120513916015625, 2.23956298828125, 2.358612060546875, 2.4776611328125, 2.596710205078125, 2.71575927734375, 2.834808349609375, 2.953857421875, 3.072906494140625, 3.19195556640625, 3.311004638671875, 3.4300537109375, 3.549102783203125, 3.66815185546875, 3.787200927734375, 3.90625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 7.0, 3.0, 8.0, 8.0, 15.0, 16.0, 17.0, 21.0, 27.0, 33.0, 36.0, 48.0, 35.0, 38.0, 57.0, 48.0, 58.0, 51.0, 48.0, 48.0, 45.0, 51.0, 50.0, 36.0, 34.0, 29.0, 18.0, 16.0, 15.0, 19.0, 9.0, 11.0, 8.0, 11.0, 7.0, 8.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.6155242919921875, -1.544525146484375, -1.4735260009765625, -1.40252685546875, -1.3315277099609375, -1.260528564453125, -1.1895294189453125, -1.1185302734375, -1.0475311279296875, -0.976531982421875, -0.9055328369140625, -0.83453369140625, -0.7635345458984375, -0.692535400390625, -0.6215362548828125, -0.550537109375, -0.4795379638671875, -0.408538818359375, -0.3375396728515625, -0.26654052734375, -0.1955413818359375, -0.124542236328125, -0.0535430908203125, 0.0174560546875, 0.0884552001953125, 0.159454345703125, 0.2304534912109375, 0.30145263671875, 0.3724517822265625, 0.443450927734375, 0.5144500732421875, 0.58544921875, 0.6564483642578125, 0.727447509765625, 0.7984466552734375, 0.86944580078125, 0.9404449462890625, 1.011444091796875, 1.0824432373046875, 1.1534423828125, 1.2244415283203125, 1.295440673828125, 1.3664398193359375, 1.43743896484375, 1.5084381103515625, 1.579437255859375, 1.6504364013671875, 1.721435546875, 1.7924346923828125, 1.863433837890625, 1.9344329833984375, 2.00543212890625, 2.0764312744140625, 2.147430419921875, 2.2184295654296875, 2.2894287109375, 2.3604278564453125, 2.431427001953125, 2.5024261474609375, 2.57342529296875, 2.6444244384765625, 2.715423583984375, 2.7864227294921875, 2.857421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 4.0, 12.0, 11.0, 15.0, 19.0, 38.0, 43.0, 61.0, 63.0, 117.0, 221.0, 325.0, 616.0, 1014.0, 1971.0, 3408.0, 6317.0, 12293.0, 25411.0, 57903.0, 149352.0, 311297.0, 272042.0, 116766.0, 45777.0, 20757.0, 10479.0, 5372.0, 2941.0, 1502.0, 935.0, 523.0, 308.0, 203.0, 126.0, 88.0, 53.0, 49.0, 29.0, 20.0, 16.0, 17.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73828125, -2.6466064453125, -2.554931640625, -2.4632568359375, -2.37158203125, -2.2799072265625, -2.188232421875, -2.0965576171875, -2.0048828125, -1.9132080078125, -1.821533203125, -1.7298583984375, -1.63818359375, -1.5465087890625, -1.454833984375, -1.3631591796875, -1.271484375, -1.1798095703125, -1.088134765625, -0.9964599609375, -0.90478515625, -0.8131103515625, -0.721435546875, -0.6297607421875, -0.5380859375, -0.4464111328125, -0.354736328125, -0.2630615234375, -0.17138671875, -0.0797119140625, 0.011962890625, 0.1036376953125, 0.1953125, 0.2869873046875, 0.378662109375, 0.4703369140625, 0.56201171875, 0.6536865234375, 0.745361328125, 0.8370361328125, 0.9287109375, 1.0203857421875, 1.112060546875, 1.2037353515625, 1.29541015625, 1.3870849609375, 1.478759765625, 1.5704345703125, 1.662109375, 1.7537841796875, 1.845458984375, 1.9371337890625, 2.02880859375, 2.1204833984375, 2.212158203125, 2.3038330078125, 2.3955078125, 2.4871826171875, 2.578857421875, 2.6705322265625, 2.76220703125, 2.8538818359375, 2.945556640625, 3.0372314453125, 3.12890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 2.0, 7.0, 9.0, 8.0, 12.0, 13.0, 21.0, 13.0, 23.0, 23.0, 25.0, 31.0, 32.0, 38.0, 40.0, 51.0, 59.0, 37.0, 51.0, 50.0, 40.0, 40.0, 50.0, 37.0, 36.0, 36.0, 25.0, 22.0, 18.0, 29.0, 20.0, 18.0, 17.0, 10.0, 5.0, 5.0, 4.0, 6.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-6.48046875, -6.26605224609375, -6.0516357421875, -5.83721923828125, -5.622802734375, -5.40838623046875, -5.1939697265625, -4.97955322265625, -4.76513671875, -4.55072021484375, -4.3363037109375, -4.12188720703125, -3.907470703125, -3.69305419921875, -3.4786376953125, -3.26422119140625, -3.0498046875, -2.83538818359375, -2.6209716796875, -2.40655517578125, -2.192138671875, -1.97772216796875, -1.7633056640625, -1.54888916015625, -1.33447265625, -1.12005615234375, -0.9056396484375, -0.69122314453125, -0.476806640625, -0.26239013671875, -0.0479736328125, 0.16644287109375, 0.380859375, 0.59527587890625, 0.8096923828125, 1.02410888671875, 1.238525390625, 1.45294189453125, 1.6673583984375, 1.88177490234375, 2.09619140625, 2.31060791015625, 2.5250244140625, 2.73944091796875, 2.953857421875, 3.16827392578125, 3.3826904296875, 3.59710693359375, 3.8115234375, 4.02593994140625, 4.2403564453125, 4.45477294921875, 4.669189453125, 4.88360595703125, 5.0980224609375, 5.31243896484375, 5.52685546875, 5.74127197265625, 5.9556884765625, 6.17010498046875, 6.384521484375, 6.59893798828125, 6.8133544921875, 7.02777099609375, 7.2421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 5.0, 14.0, 27.0, 39.0, 61.0, 86.0, 134.0, 194.0, 317.0, 486.0, 784.0, 1273.0, 2142.0, 3486.0, 5674.0, 10381.0, 20005.0, 46476.0, 119441.0, 282416.0, 310863.0, 139543.0, 53877.0, 23150.0, 11544.0, 6402.0, 3747.0, 2305.0, 1365.0, 863.0, 515.0, 312.0, 223.0, 136.0, 111.0, 57.0, 42.0, 25.0, 11.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0712890625, -1.034454345703125, -0.99761962890625, -0.960784912109375, -0.9239501953125, -0.887115478515625, -0.85028076171875, -0.813446044921875, -0.776611328125, -0.739776611328125, -0.70294189453125, -0.666107177734375, -0.6292724609375, -0.592437744140625, -0.55560302734375, -0.518768310546875, -0.48193359375, -0.445098876953125, -0.40826416015625, -0.371429443359375, -0.3345947265625, -0.297760009765625, -0.26092529296875, -0.224090576171875, -0.187255859375, -0.150421142578125, -0.11358642578125, -0.076751708984375, -0.0399169921875, -0.003082275390625, 0.03375244140625, 0.070587158203125, 0.107421875, 0.144256591796875, 0.18109130859375, 0.217926025390625, 0.2547607421875, 0.291595458984375, 0.32843017578125, 0.365264892578125, 0.402099609375, 0.438934326171875, 0.47576904296875, 0.512603759765625, 0.5494384765625, 0.586273193359375, 0.62310791015625, 0.659942626953125, 0.69677734375, 0.733612060546875, 0.77044677734375, 0.807281494140625, 0.8441162109375, 0.880950927734375, 0.91778564453125, 0.954620361328125, 0.991455078125, 1.028289794921875, 1.06512451171875, 1.101959228515625, 1.1387939453125, 1.175628662109375, 1.21246337890625, 1.249298095703125, 1.2861328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 14.0, 9.0, 16.0, 32.0, 54.0, 72.0, 128.0, 183.0, 147.0, 104.0, 54.0, 59.0, 37.0, 21.0, 13.0, 9.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006761550903320312, -0.0006555542349815369, -0.0006349533796310425, -0.0006143525242805481, -0.0005937516689300537, -0.0005731508135795593, -0.0005525499582290649, -0.0005319491028785706, -0.0005113482475280762, -0.0004907473921775818, -0.0004701465368270874, -0.000449545681476593, -0.00042894482612609863, -0.00040834397077560425, -0.00038774311542510986, -0.0003671422600746155, -0.0003465414047241211, -0.0003259405493736267, -0.0003053396940231323, -0.00028473883867263794, -0.00026413798332214355, -0.00024353712797164917, -0.00022293627262115479, -0.0002023354172706604, -0.00018173456192016602, -0.00016113370656967163, -0.00014053285121917725, -0.00011993199586868286, -9.933114051818848e-05, -7.873028516769409e-05, -5.812942981719971e-05, -3.752857446670532e-05, -1.6927719116210938e-05, 3.6731362342834473e-06, 2.4273991584777832e-05, 4.487484693527222e-05, 6.54757022857666e-05, 8.607655763626099e-05, 0.00010667741298675537, 0.00012727826833724976, 0.00014787912368774414, 0.00016847997903823853, 0.0001890808343887329, 0.0002096816897392273, 0.00023028254508972168, 0.00025088340044021606, 0.00027148425579071045, 0.00029208511114120483, 0.0003126859664916992, 0.0003332868218421936, 0.000353887677192688, 0.0003744885325431824, 0.00039508938789367676, 0.00041569024324417114, 0.00043629109859466553, 0.0004568919539451599, 0.0004774928092956543, 0.0004980936646461487, 0.0005186945199966431, 0.0005392953753471375, 0.0005598962306976318, 0.0005804970860481262, 0.0006010979413986206, 0.000621698796749115, 0.0006422996520996094]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 7.0, 15.0, 21.0, 27.0, 43.0, 71.0, 100.0, 157.0, 242.0, 399.0, 676.0, 1195.0, 2051.0, 3620.0, 6650.0, 13219.0, 27648.0, 59486.0, 129740.0, 234820.0, 259966.0, 161617.0, 76939.0, 34703.0, 16552.0, 8218.0, 4413.0, 2407.0, 1424.0, 777.0, 503.0, 293.0, 192.0, 113.0, 69.0, 62.0, 30.0, 18.0, 20.0, 11.0, 8.0, 8.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0009765625, -0.9716720581054688, -0.9423675537109375, -0.9130630493164062, -0.883758544921875, -0.8544540405273438, -0.8251495361328125, -0.7958450317382812, -0.76654052734375, -0.7372360229492188, -0.7079315185546875, -0.6786270141601562, -0.649322509765625, -0.6200180053710938, -0.5907135009765625, -0.5614089965820312, -0.5321044921875, -0.5027999877929688, -0.4734954833984375, -0.44419097900390625, -0.414886474609375, -0.38558197021484375, -0.3562774658203125, -0.32697296142578125, -0.29766845703125, -0.26836395263671875, -0.2390594482421875, -0.20975494384765625, -0.180450439453125, -0.15114593505859375, -0.1218414306640625, -0.09253692626953125, -0.063232421875, -0.03392791748046875, -0.0046234130859375, 0.02468109130859375, 0.053985595703125, 0.08329010009765625, 0.1125946044921875, 0.14189910888671875, 0.17120361328125, 0.20050811767578125, 0.2298126220703125, 0.25911712646484375, 0.288421630859375, 0.31772613525390625, 0.3470306396484375, 0.37633514404296875, 0.4056396484375, 0.43494415283203125, 0.4642486572265625, 0.49355316162109375, 0.522857666015625, 0.5521621704101562, 0.5814666748046875, 0.6107711791992188, 0.64007568359375, 0.6693801879882812, 0.6986846923828125, 0.7279891967773438, 0.757293701171875, 0.7865982055664062, 0.8159027099609375, 0.8452072143554688, 0.87451171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 9.0, 3.0, 16.0, 8.0, 14.0, 17.0, 30.0, 34.0, 39.0, 42.0, 56.0, 42.0, 65.0, 63.0, 59.0, 70.0, 62.0, 56.0, 54.0, 42.0, 29.0, 39.0, 19.0, 19.0, 19.0, 13.0, 13.0, 5.0, 2.0, 6.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.166015625, -1.1263580322265625, -1.086700439453125, -1.0470428466796875, -1.00738525390625, -0.9677276611328125, -0.928070068359375, -0.8884124755859375, -0.8487548828125, -0.8090972900390625, -0.769439697265625, -0.7297821044921875, -0.69012451171875, -0.6504669189453125, -0.610809326171875, -0.5711517333984375, -0.531494140625, -0.4918365478515625, -0.452178955078125, -0.4125213623046875, -0.37286376953125, -0.3332061767578125, -0.293548583984375, -0.2538909912109375, -0.2142333984375, -0.1745758056640625, -0.134918212890625, -0.0952606201171875, -0.05560302734375, -0.0159454345703125, 0.023712158203125, 0.0633697509765625, 0.10302734375, 0.1426849365234375, 0.182342529296875, 0.2220001220703125, 0.26165771484375, 0.3013153076171875, 0.340972900390625, 0.3806304931640625, 0.4202880859375, 0.4599456787109375, 0.499603271484375, 0.5392608642578125, 0.57891845703125, 0.6185760498046875, 0.658233642578125, 0.6978912353515625, 0.737548828125, 0.7772064208984375, 0.816864013671875, 0.8565216064453125, 0.89617919921875, 0.9358367919921875, 0.975494384765625, 1.0151519775390625, 1.0548095703125, 1.0944671630859375, 1.134124755859375, 1.1737823486328125, 1.21343994140625, 1.2530975341796875, 1.292755126953125, 1.3324127197265625, 1.3720703125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 9.0, 14.0, 23.0, 44.0, 61.0, 102.0, 124.0, 156.0, 149.0, 98.0, 85.0, 48.0, 26.0, 18.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140583038330078, -16.473159790039062, -15.80573558807373, -15.138311386108398, -14.470888137817383, -13.803464889526367, -13.136040687561035, -12.468616485595703, -11.801193237304688, -11.133769989013672, -10.46634578704834, -9.798921585083008, -9.131498336791992, -8.464075088500977, -7.7966508865356445, -7.129227161407471, -6.461803436279297, -5.794379711151123, -5.126955986022949, -4.459532260894775, -3.7921085357666016, -3.1246848106384277, -2.457261085510254, -1.78983736038208, -1.1224136352539062, -0.4549899101257324, 0.2124338150024414, 0.8798575401306152, 1.547281265258789, 2.214704990386963, 2.8821287155151367, 3.5495524406433105, 4.216974258422852, 4.884397983551025, 5.551821708679199, 6.219245433807373, 6.886669158935547, 7.554092884063721, 8.221516609191895, 8.888940811157227, 9.556364059448242, 10.223787307739258, 10.89121150970459, 11.558635711669922, 12.226058959960938, 12.893482208251953, 13.560906410217285, 14.228330612182617, 14.895753860473633, 15.563177108764648, 16.230602264404297, 16.898025512695312, 17.565448760986328, 18.232872009277344, 18.90029525756836, 19.567720413208008, 20.235143661499023, 20.90256690979004, 21.569992065429688, 22.237415313720703, 22.90483856201172, 23.572261810302734, 24.23968505859375, 24.9071102142334, 25.574533462524414]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 1.0, 3.0, 4.0, 5.0, 8.0, 4.0, 10.0, 8.0, 6.0, 16.0, 22.0, 19.0, 31.0, 23.0, 26.0, 28.0, 32.0, 28.0, 34.0, 36.0, 43.0, 39.0, 40.0, 25.0, 41.0, 42.0, 38.0, 43.0, 40.0, 26.0, 34.0, 32.0, 35.0, 28.0, 30.0, 20.0, 19.0, 23.0, 14.0, 11.0, 8.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.676050186157227, -14.19009780883789, -13.704145431518555, -13.218193054199219, -12.732240676879883, -12.246288299560547, -11.760335922241211, -11.274383544921875, -10.788431167602539, -10.302478790283203, -9.816526412963867, -9.330574035644531, -8.844621658325195, -8.35866928100586, -7.872716903686523, -7.3867645263671875, -6.900811672210693, -6.414859294891357, -5.9289069175720215, -5.4429545402526855, -4.95700216293335, -4.4710493087768555, -3.9850971698760986, -3.4991447925567627, -3.0131924152374268, -2.527240037918091, -2.041287660598755, -1.5553351640701294, -1.0693827867507935, -0.583430290222168, -0.09747791290283203, 0.3884744644165039, 0.8744268417358398, 1.3603792190551758, 1.8463315963745117, 2.3322839736938477, 2.8182363510131836, 3.3041889667510986, 3.7901413440704346, 4.276093482971191, 4.762045860290527, 5.247998237609863, 5.733950614929199, 6.219902992248535, 6.705855369567871, 7.191807746887207, 7.677760124206543, 8.163712501525879, 8.649665832519531, 9.135618209838867, 9.621570587158203, 10.107522964477539, 10.593475341796875, 11.079427719116211, 11.565380096435547, 12.051332473754883, 12.537284851074219, 13.023237228393555, 13.50918960571289, 13.995141983032227, 14.481094360351562, 14.967046737670898, 15.452999114990234, 15.93895149230957, 16.424903869628906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 10.0, 9.0, 18.0, 20.0, 25.0, 42.0, 59.0, 106.0, 160.0, 268.0, 421.0, 673.0, 1222.0, 2182.0, 3908.0, 7873.0, 15596.0, 33879.0, 79159.0, 193539.0, 467762.0, 960540.0, 1181459.0, 715037.0, 309408.0, 123302.0, 51089.0, 22632.0, 10950.0, 5566.0, 2926.0, 1725.0, 947.0, 616.0, 389.0, 225.0, 163.0, 114.0, 62.0, 60.0, 36.0, 23.0, 26.0, 16.0, 8.0, 9.0, 7.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4501953125, -1.3949737548828125, -1.339752197265625, -1.2845306396484375, -1.22930908203125, -1.1740875244140625, -1.118865966796875, -1.0636444091796875, -1.0084228515625, -0.9532012939453125, -0.897979736328125, -0.8427581787109375, -0.78753662109375, -0.7323150634765625, -0.677093505859375, -0.6218719482421875, -0.566650390625, -0.5114288330078125, -0.456207275390625, -0.4009857177734375, -0.34576416015625, -0.2905426025390625, -0.235321044921875, -0.1800994873046875, -0.1248779296875, -0.0696563720703125, -0.014434814453125, 0.0407867431640625, 0.09600830078125, 0.1512298583984375, 0.206451416015625, 0.2616729736328125, 0.31689453125, 0.3721160888671875, 0.427337646484375, 0.4825592041015625, 0.53778076171875, 0.5930023193359375, 0.648223876953125, 0.7034454345703125, 0.7586669921875, 0.8138885498046875, 0.869110107421875, 0.9243316650390625, 0.97955322265625, 1.0347747802734375, 1.089996337890625, 1.1452178955078125, 1.200439453125, 1.2556610107421875, 1.310882568359375, 1.3661041259765625, 1.42132568359375, 1.4765472412109375, 1.531768798828125, 1.5869903564453125, 1.6422119140625, 1.6974334716796875, 1.752655029296875, 1.8078765869140625, 1.86309814453125, 1.9183197021484375, 1.973541259765625, 2.0287628173828125, 2.083984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 10.0, 10.0, 7.0, 14.0, 16.0, 17.0, 28.0, 28.0, 27.0, 27.0, 47.0, 33.0, 51.0, 41.0, 50.0, 44.0, 56.0, 49.0, 39.0, 42.0, 41.0, 44.0, 36.0, 34.0, 29.0, 28.0, 19.0, 26.0, 19.0, 16.0, 14.0, 12.0, 8.0, 5.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.230224609375, -2.15771484375, -2.085205078125, -2.0126953125, -1.940185546875, -1.86767578125, -1.795166015625, -1.72265625, -1.650146484375, -1.57763671875, -1.505126953125, -1.4326171875, -1.360107421875, -1.28759765625, -1.215087890625, -1.142578125, -1.070068359375, -0.99755859375, -0.925048828125, -0.8525390625, -0.780029296875, -0.70751953125, -0.635009765625, -0.5625, -0.489990234375, -0.41748046875, -0.344970703125, -0.2724609375, -0.199951171875, -0.12744140625, -0.054931640625, 0.017578125, 0.090087890625, 0.16259765625, 0.235107421875, 0.3076171875, 0.380126953125, 0.45263671875, 0.525146484375, 0.59765625, 0.670166015625, 0.74267578125, 0.815185546875, 0.8876953125, 0.960205078125, 1.03271484375, 1.105224609375, 1.177734375, 1.250244140625, 1.32275390625, 1.395263671875, 1.4677734375, 1.540283203125, 1.61279296875, 1.685302734375, 1.7578125, 1.830322265625, 1.90283203125, 1.975341796875, 2.0478515625, 2.120361328125, 2.19287109375, 2.265380859375, 2.337890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 7.0, 17.0, 15.0, 31.0, 35.0, 39.0, 71.0, 116.0, 144.0, 254.0, 401.0, 634.0, 1205.0, 2285.0, 4702.0, 10487.0, 26513.0, 74996.0, 244695.0, 1015922.0, 1997200.0, 575616.0, 154650.0, 50058.0, 18545.0, 7740.0, 3573.0, 1802.0, 998.0, 558.0, 322.0, 222.0, 129.0, 82.0, 54.0, 36.0, 26.0, 24.0, 14.0, 11.0, 13.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-3.130859375, -3.03961181640625, -2.9483642578125, -2.85711669921875, -2.765869140625, -2.67462158203125, -2.5833740234375, -2.49212646484375, -2.40087890625, -2.30963134765625, -2.2183837890625, -2.12713623046875, -2.035888671875, -1.94464111328125, -1.8533935546875, -1.76214599609375, -1.6708984375, -1.57965087890625, -1.4884033203125, -1.39715576171875, -1.305908203125, -1.21466064453125, -1.1234130859375, -1.03216552734375, -0.94091796875, -0.84967041015625, -0.7584228515625, -0.66717529296875, -0.575927734375, -0.48468017578125, -0.3934326171875, -0.30218505859375, -0.2109375, -0.11968994140625, -0.0284423828125, 0.06280517578125, 0.154052734375, 0.24530029296875, 0.3365478515625, 0.42779541015625, 0.51904296875, 0.61029052734375, 0.7015380859375, 0.79278564453125, 0.884033203125, 0.97528076171875, 1.0665283203125, 1.15777587890625, 1.2490234375, 1.34027099609375, 1.4315185546875, 1.52276611328125, 1.614013671875, 1.70526123046875, 1.7965087890625, 1.88775634765625, 1.97900390625, 2.07025146484375, 2.1614990234375, 2.25274658203125, 2.343994140625, 2.43524169921875, 2.5264892578125, 2.61773681640625, 2.708984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 19.0, 22.0, 25.0, 35.0, 30.0, 43.0, 69.0, 102.0, 162.0, 189.0, 299.0, 390.0, 530.0, 559.0, 454.0, 308.0, 245.0, 158.0, 109.0, 54.0, 56.0, 53.0, 26.0, 29.0, 13.0, 21.0, 14.0, 4.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.6953125, -3.57666015625, -3.4580078125, -3.33935546875, -3.220703125, -3.10205078125, -2.9833984375, -2.86474609375, -2.74609375, -2.62744140625, -2.5087890625, -2.39013671875, -2.271484375, -2.15283203125, -2.0341796875, -1.91552734375, -1.796875, -1.67822265625, -1.5595703125, -1.44091796875, -1.322265625, -1.20361328125, -1.0849609375, -0.96630859375, -0.84765625, -0.72900390625, -0.6103515625, -0.49169921875, -0.373046875, -0.25439453125, -0.1357421875, -0.01708984375, 0.1015625, 0.22021484375, 0.3388671875, 0.45751953125, 0.576171875, 0.69482421875, 0.8134765625, 0.93212890625, 1.05078125, 1.16943359375, 1.2880859375, 1.40673828125, 1.525390625, 1.64404296875, 1.7626953125, 1.88134765625, 2.0, 2.11865234375, 2.2373046875, 2.35595703125, 2.474609375, 2.59326171875, 2.7119140625, 2.83056640625, 2.94921875, 3.06787109375, 3.1865234375, 3.30517578125, 3.423828125, 3.54248046875, 3.6611328125, 3.77978515625, 3.8984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 31.0, 119.0, 229.0, 303.0, 199.0, 73.0, 24.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.60888671875, -66.94815063476562, -65.28742218017578, -63.626686096191406, -61.96595001220703, -60.30521774291992, -58.64448547363281, -56.98374938964844, -55.32301330566406, -53.66228103637695, -52.00154495239258, -50.34081268310547, -48.680076599121094, -47.019344329833984, -45.358612060546875, -43.6978759765625, -42.03714370727539, -40.37641143798828, -38.715675354003906, -37.0549430847168, -35.39420700073242, -33.73347473144531, -32.07273864746094, -30.412006378173828, -28.751272201538086, -27.090538024902344, -25.4298038482666, -23.76906967163086, -22.10833740234375, -20.447601318359375, -18.786869049072266, -17.126134872436523, -15.465404510498047, -13.804670333862305, -12.143936157226562, -10.483202934265137, -8.822468757629395, -7.161734580993652, -5.501001358032227, -3.8402671813964844, -2.179533004760742, -0.5187990665435791, 1.141934871673584, 2.802668571472168, 4.46340274810791, 6.124136924743652, 7.784870147705078, 9.44560432434082, 11.106338500976562, 12.767072677612305, 14.427806854248047, 16.088539123535156, 17.74927520751953, 19.41000747680664, 21.070741653442383, 22.731475830078125, 24.392210006713867, 26.05294418334961, 27.71367835998535, 29.374412536621094, 31.035144805908203, 32.69588088989258, 34.35661315917969, 36.01734924316406, 37.67808151245117]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 13.0, 17.0, 17.0, 23.0, 17.0, 27.0, 25.0, 30.0, 39.0, 32.0, 61.0, 45.0, 38.0, 41.0, 39.0, 49.0, 57.0, 49.0, 47.0, 38.0, 34.0, 43.0, 25.0, 28.0, 40.0, 21.0, 14.0, 13.0, 6.0, 9.0, 10.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.223922729492188, -14.78917407989502, -14.354426383972168, -13.919677734375, -13.484930038452148, -13.05018138885498, -12.615432739257812, -12.180685043334961, -11.74593734741211, -11.311188697814941, -10.87644100189209, -10.441692352294922, -10.00694465637207, -9.572196006774902, -9.137447357177734, -8.702699661254883, -8.267951011657715, -7.833202838897705, -7.398454666137695, -6.963706016540527, -6.528958320617676, -6.094209671020508, -5.659461498260498, -5.224713325500488, -4.7899651527404785, -4.355216979980469, -3.920468807220459, -3.48572039604187, -3.0509722232818604, -2.6162240505218506, -2.1814756393432617, -1.746727466583252, -1.3119792938232422, -0.8772310614585876, -0.4424828290939331, -0.007734537124633789, 0.427013635635376, 0.8617618083953857, 1.2965102195739746, 1.7312583923339844, 2.166006565093994, 2.600754737854004, 3.0355029106140137, 3.4702513217926025, 3.9049994945526123, 4.339747428894043, 4.774496078491211, 5.209244251251221, 5.6439924240112305, 6.07874059677124, 6.51348876953125, 6.948237419128418, 7.3829851150512695, 7.8177337646484375, 8.252481460571289, 8.687230110168457, 9.121978759765625, 9.556727409362793, 9.991475105285645, 10.426223754882812, 10.860971450805664, 11.295720100402832, 11.73046875, 12.165216445922852, 12.599964141845703]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 10.0, 11.0, 22.0, 42.0, 43.0, 94.0, 207.0, 381.0, 693.0, 1352.0, 2537.0, 4841.0, 9356.0, 21045.0, 63905.0, 228765.0, 407995.0, 210596.0, 58439.0, 19435.0, 9038.0, 4554.0, 2450.0, 1254.0, 700.0, 349.0, 182.0, 98.0, 55.0, 36.0, 29.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.9901123046875, -3.859130859375, -3.7281494140625, -3.59716796875, -3.4661865234375, -3.335205078125, -3.2042236328125, -3.0732421875, -2.9422607421875, -2.811279296875, -2.6802978515625, -2.54931640625, -2.4183349609375, -2.287353515625, -2.1563720703125, -2.025390625, -1.8944091796875, -1.763427734375, -1.6324462890625, -1.50146484375, -1.3704833984375, -1.239501953125, -1.1085205078125, -0.9775390625, -0.8465576171875, -0.715576171875, -0.5845947265625, -0.45361328125, -0.3226318359375, -0.191650390625, -0.0606689453125, 0.0703125, 0.2012939453125, 0.332275390625, 0.4632568359375, 0.59423828125, 0.7252197265625, 0.856201171875, 0.9871826171875, 1.1181640625, 1.2491455078125, 1.380126953125, 1.5111083984375, 1.64208984375, 1.7730712890625, 1.904052734375, 2.0350341796875, 2.166015625, 2.2969970703125, 2.427978515625, 2.5589599609375, 2.68994140625, 2.8209228515625, 2.951904296875, 3.0828857421875, 3.2138671875, 3.3448486328125, 3.475830078125, 3.6068115234375, 3.73779296875, 3.8687744140625, 3.999755859375, 4.1307373046875, 4.26171875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 10.0, 14.0, 12.0, 21.0, 31.0, 28.0, 26.0, 29.0, 29.0, 29.0, 32.0, 35.0, 38.0, 49.0, 50.0, 45.0, 47.0, 41.0, 49.0, 29.0, 39.0, 34.0, 32.0, 37.0, 33.0, 24.0, 16.0, 25.0, 24.0, 8.0, 11.0, 10.0, 12.0, 6.0, 8.0, 2.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.105377197265625, -2.03497314453125, -1.964569091796875, -1.8941650390625, -1.823760986328125, -1.75335693359375, -1.682952880859375, -1.612548828125, -1.542144775390625, -1.47174072265625, -1.401336669921875, -1.3309326171875, -1.260528564453125, -1.19012451171875, -1.119720458984375, -1.04931640625, -0.978912353515625, -0.90850830078125, -0.838104248046875, -0.7677001953125, -0.697296142578125, -0.62689208984375, -0.556488037109375, -0.486083984375, -0.415679931640625, -0.34527587890625, -0.274871826171875, -0.2044677734375, -0.134063720703125, -0.06365966796875, 0.006744384765625, 0.0771484375, 0.147552490234375, 0.21795654296875, 0.288360595703125, 0.3587646484375, 0.429168701171875, 0.49957275390625, 0.569976806640625, 0.640380859375, 0.710784912109375, 0.78118896484375, 0.851593017578125, 0.9219970703125, 0.992401123046875, 1.06280517578125, 1.133209228515625, 1.20361328125, 1.274017333984375, 1.34442138671875, 1.414825439453125, 1.4852294921875, 1.555633544921875, 1.62603759765625, 1.696441650390625, 1.766845703125, 1.837249755859375, 1.90765380859375, 1.978057861328125, 2.0484619140625, 2.118865966796875, 2.18927001953125, 2.259674072265625, 2.330078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 14.0, 21.0, 23.0, 42.0, 33.0, 77.0, 92.0, 146.0, 232.0, 356.0, 620.0, 1014.0, 1818.0, 3076.0, 5663.0, 10668.0, 21017.0, 47880.0, 119823.0, 265087.0, 299836.0, 155660.0, 60941.0, 26018.0, 12756.0, 6658.0, 3779.0, 2141.0, 1192.0, 675.0, 430.0, 237.0, 155.0, 108.0, 67.0, 54.0, 33.0, 25.0, 25.0, 11.0, 10.0, 6.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.150390625, -3.055328369140625, -2.96026611328125, -2.865203857421875, -2.7701416015625, -2.675079345703125, -2.58001708984375, -2.484954833984375, -2.389892578125, -2.294830322265625, -2.19976806640625, -2.104705810546875, -2.0096435546875, -1.914581298828125, -1.81951904296875, -1.724456787109375, -1.62939453125, -1.534332275390625, -1.43927001953125, -1.344207763671875, -1.2491455078125, -1.154083251953125, -1.05902099609375, -0.963958740234375, -0.868896484375, -0.773834228515625, -0.67877197265625, -0.583709716796875, -0.4886474609375, -0.393585205078125, -0.29852294921875, -0.203460693359375, -0.1083984375, -0.013336181640625, 0.08172607421875, 0.176788330078125, 0.2718505859375, 0.366912841796875, 0.46197509765625, 0.557037353515625, 0.652099609375, 0.747161865234375, 0.84222412109375, 0.937286376953125, 1.0323486328125, 1.127410888671875, 1.22247314453125, 1.317535400390625, 1.41259765625, 1.507659912109375, 1.60272216796875, 1.697784423828125, 1.7928466796875, 1.887908935546875, 1.98297119140625, 2.078033447265625, 2.173095703125, 2.268157958984375, 2.36322021484375, 2.458282470703125, 2.5533447265625, 2.648406982421875, 2.74346923828125, 2.838531494140625, 2.93359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 7.0, 3.0, 4.0, 7.0, 8.0, 8.0, 9.0, 9.0, 14.0, 18.0, 12.0, 14.0, 16.0, 31.0, 21.0, 22.0, 25.0, 23.0, 38.0, 31.0, 35.0, 32.0, 38.0, 38.0, 42.0, 35.0, 37.0, 45.0, 34.0, 28.0, 35.0, 30.0, 30.0, 30.0, 17.0, 16.0, 34.0, 15.0, 16.0, 10.0, 9.0, 15.0, 10.0, 8.0, 9.0, 7.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 4.0, 4.0], "bins": [-6.09375, -5.91748046875, -5.7412109375, -5.56494140625, -5.388671875, -5.21240234375, -5.0361328125, -4.85986328125, -4.68359375, -4.50732421875, -4.3310546875, -4.15478515625, -3.978515625, -3.80224609375, -3.6259765625, -3.44970703125, -3.2734375, -3.09716796875, -2.9208984375, -2.74462890625, -2.568359375, -2.39208984375, -2.2158203125, -2.03955078125, -1.86328125, -1.68701171875, -1.5107421875, -1.33447265625, -1.158203125, -0.98193359375, -0.8056640625, -0.62939453125, -0.453125, -0.27685546875, -0.1005859375, 0.07568359375, 0.251953125, 0.42822265625, 0.6044921875, 0.78076171875, 0.95703125, 1.13330078125, 1.3095703125, 1.48583984375, 1.662109375, 1.83837890625, 2.0146484375, 2.19091796875, 2.3671875, 2.54345703125, 2.7197265625, 2.89599609375, 3.072265625, 3.24853515625, 3.4248046875, 3.60107421875, 3.77734375, 3.95361328125, 4.1298828125, 4.30615234375, 4.482421875, 4.65869140625, 4.8349609375, 5.01123046875, 5.1875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 6.0, 10.0, 5.0, 5.0, 10.0, 19.0, 30.0, 36.0, 57.0, 66.0, 100.0, 153.0, 222.0, 284.0, 434.0, 648.0, 989.0, 1558.0, 2592.0, 4118.0, 6990.0, 12902.0, 24570.0, 49570.0, 112856.0, 229507.0, 277342.0, 169370.0, 76723.0, 35485.0, 17837.0, 9621.0, 5572.0, 3185.0, 1900.0, 1247.0, 839.0, 521.0, 369.0, 285.0, 164.0, 108.0, 87.0, 63.0, 26.0, 24.0, 23.0, 14.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.89501953125, -0.8644332885742188, -0.8338470458984375, -0.8032608032226562, -0.772674560546875, -0.7420883178710938, -0.7115020751953125, -0.6809158325195312, -0.65032958984375, -0.6197433471679688, -0.5891571044921875, -0.5585708618164062, -0.527984619140625, -0.49739837646484375, -0.4668121337890625, -0.43622589111328125, -0.4056396484375, -0.37505340576171875, -0.3444671630859375, -0.31388092041015625, -0.283294677734375, -0.25270843505859375, -0.2221221923828125, -0.19153594970703125, -0.16094970703125, -0.13036346435546875, -0.0997772216796875, -0.06919097900390625, -0.038604736328125, -0.00801849365234375, 0.0225677490234375, 0.05315399169921875, 0.083740234375, 0.11432647705078125, 0.1449127197265625, 0.17549896240234375, 0.206085205078125, 0.23667144775390625, 0.2672576904296875, 0.29784393310546875, 0.32843017578125, 0.35901641845703125, 0.3896026611328125, 0.42018890380859375, 0.450775146484375, 0.48136138916015625, 0.5119476318359375, 0.5425338745117188, 0.5731201171875, 0.6037063598632812, 0.6342926025390625, 0.6648788452148438, 0.695465087890625, 0.7260513305664062, 0.7566375732421875, 0.7872238159179688, 0.81781005859375, 0.8483963012695312, 0.8789825439453125, 0.9095687866210938, 0.940155029296875, 0.9707412719726562, 1.0013275146484375, 1.0319137573242188, 1.0625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 3.0, 9.0, 11.0, 15.0, 18.0, 29.0, 51.0, 49.0, 83.0, 102.0, 122.0, 99.0, 103.0, 80.0, 62.0, 38.0, 19.0, 26.0, 10.0, 8.0, 6.0, 9.0, 9.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003757476806640625, -0.0003598928451538086, -0.0003440380096435547, -0.0003281831741333008, -0.0003123283386230469, -0.00029647350311279297, -0.00028061866760253906, -0.00026476383209228516, -0.00024890899658203125, -0.00023305416107177734, -0.00021719932556152344, -0.00020134449005126953, -0.00018548965454101562, -0.00016963481903076172, -0.0001537799835205078, -0.0001379251480102539, -0.0001220703125, -0.0001062154769897461, -9.036064147949219e-05, -7.450580596923828e-05, -5.8650970458984375e-05, -4.279613494873047e-05, -2.6941299438476562e-05, -1.1086463928222656e-05, 4.76837158203125e-06, 2.0623207092285156e-05, 3.647804260253906e-05, 5.233287811279297e-05, 6.818771362304688e-05, 8.404254913330078e-05, 9.989738464355469e-05, 0.0001157522201538086, 0.0001316070556640625, 0.0001474618911743164, 0.0001633167266845703, 0.00017917156219482422, 0.00019502639770507812, 0.00021088123321533203, 0.00022673606872558594, 0.00024259090423583984, 0.00025844573974609375, 0.00027430057525634766, 0.00029015541076660156, 0.00030601024627685547, 0.0003218650817871094, 0.0003377199172973633, 0.0003535747528076172, 0.0003694295883178711, 0.000385284423828125, 0.0004011392593383789, 0.0004169940948486328, 0.0004328489303588867, 0.0004487037658691406, 0.00046455860137939453, 0.00048041343688964844, 0.0004962682723999023, 0.0005121231079101562, 0.0005279779434204102, 0.0005438327789306641, 0.000559687614440918, 0.0005755424499511719, 0.0005913972854614258, 0.0006072521209716797, 0.0006231069564819336, 0.0006389617919921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 10.0, 12.0, 13.0, 32.0, 44.0, 101.0, 159.0, 274.0, 533.0, 1101.0, 2331.0, 5823.0, 15764.0, 49342.0, 158977.0, 356844.0, 296839.0, 108467.0, 33001.0, 11146.0, 4282.0, 1732.0, 846.0, 379.0, 202.0, 105.0, 83.0, 38.0, 21.0, 20.0, 11.0, 2.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5078125, -1.4645233154296875, -1.421234130859375, -1.3779449462890625, -1.33465576171875, -1.2913665771484375, -1.248077392578125, -1.2047882080078125, -1.1614990234375, -1.1182098388671875, -1.074920654296875, -1.0316314697265625, -0.98834228515625, -0.9450531005859375, -0.901763916015625, -0.8584747314453125, -0.815185546875, -0.7718963623046875, -0.728607177734375, -0.6853179931640625, -0.64202880859375, -0.5987396240234375, -0.555450439453125, -0.5121612548828125, -0.4688720703125, -0.4255828857421875, -0.382293701171875, -0.3390045166015625, -0.29571533203125, -0.2524261474609375, -0.209136962890625, -0.1658477783203125, -0.12255859375, -0.0792694091796875, -0.035980224609375, 0.0073089599609375, 0.05059814453125, 0.0938873291015625, 0.137176513671875, 0.1804656982421875, 0.2237548828125, 0.2670440673828125, 0.310333251953125, 0.3536224365234375, 0.39691162109375, 0.4402008056640625, 0.483489990234375, 0.5267791748046875, 0.570068359375, 0.6133575439453125, 0.656646728515625, 0.6999359130859375, 0.74322509765625, 0.7865142822265625, 0.829803466796875, 0.8730926513671875, 0.9163818359375, 0.9596710205078125, 1.002960205078125, 1.0462493896484375, 1.08953857421875, 1.1328277587890625, 1.176116943359375, 1.2194061279296875, 1.2626953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 5.0, 9.0, 6.0, 19.0, 20.0, 19.0, 32.0, 44.0, 34.0, 63.0, 68.0, 72.0, 75.0, 81.0, 60.0, 61.0, 53.0, 56.0, 39.0, 31.0, 33.0, 26.0, 26.0, 21.0, 9.0, 5.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.360076904296875, -1.31195068359375, -1.263824462890625, -1.2156982421875, -1.167572021484375, -1.11944580078125, -1.071319580078125, -1.023193359375, -0.975067138671875, -0.92694091796875, -0.878814697265625, -0.8306884765625, -0.782562255859375, -0.73443603515625, -0.686309814453125, -0.63818359375, -0.590057373046875, -0.54193115234375, -0.493804931640625, -0.4456787109375, -0.397552490234375, -0.34942626953125, -0.301300048828125, -0.253173828125, -0.205047607421875, -0.15692138671875, -0.108795166015625, -0.0606689453125, -0.012542724609375, 0.03558349609375, 0.083709716796875, 0.1318359375, 0.179962158203125, 0.22808837890625, 0.276214599609375, 0.3243408203125, 0.372467041015625, 0.42059326171875, 0.468719482421875, 0.516845703125, 0.564971923828125, 0.61309814453125, 0.661224365234375, 0.7093505859375, 0.757476806640625, 0.80560302734375, 0.853729248046875, 0.90185546875, 0.949981689453125, 0.99810791015625, 1.046234130859375, 1.0943603515625, 1.142486572265625, 1.19061279296875, 1.238739013671875, 1.286865234375, 1.334991455078125, 1.38311767578125, 1.431243896484375, 1.4793701171875, 1.527496337890625, 1.57562255859375, 1.623748779296875, 1.671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 28.0, 71.0, 135.0, 185.0, 208.0, 144.0, 100.0, 47.0, 29.0, 18.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.418155670166016, -18.450836181640625, -17.483516693115234, -16.516197204589844, -15.54887866973877, -14.581559181213379, -13.614239692687988, -12.646921157836914, -11.679601669311523, -10.712282180786133, -9.744962692260742, -8.777643203735352, -7.810324668884277, -6.843005180358887, -5.875685691833496, -4.908366680145264, -3.941046714782715, -2.9737274646759033, -2.006408214569092, -1.0390887260437012, -0.07176947593688965, 0.8955497741699219, 1.8628692626953125, 2.830188274383545, 3.7975077629089355, 4.764827251434326, 5.732146263122559, 6.699465751647949, 7.66678524017334, 8.634103775024414, 9.601423263549805, 10.568742752075195, 11.536062240600586, 12.503381729125977, 13.470701217651367, 14.438020706176758, 15.405339241027832, 16.372657775878906, 17.339977264404297, 18.307296752929688, 19.274616241455078, 20.24193572998047, 21.20925521850586, 22.17657470703125, 23.14389419555664, 24.11121368408203, 25.078533172607422, 26.04585075378418, 27.013172149658203, 27.980491638183594, 28.947811126708984, 29.915130615234375, 30.882450103759766, 31.849769592285156, 32.81708908081055, 33.78440856933594, 34.75172424316406, 35.71904373168945, 36.686363220214844, 37.653682708740234, 38.621002197265625, 39.588321685791016, 40.555641174316406, 41.5229606628418, 42.49028015136719]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 6.0, 4.0, 4.0, 6.0, 6.0, 16.0, 14.0, 16.0, 18.0, 24.0, 31.0, 37.0, 29.0, 43.0, 35.0, 35.0, 47.0, 50.0, 49.0, 42.0, 43.0, 39.0, 44.0, 43.0, 45.0, 35.0, 37.0, 34.0, 31.0, 25.0, 19.0, 18.0, 20.0, 10.0, 15.0, 6.0, 12.0, 5.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.74022102355957, -17.246177673339844, -16.752134323120117, -16.258092880249023, -15.764049530029297, -15.27000617980957, -14.775962829589844, -14.281919479370117, -13.787877082824707, -13.29383373260498, -12.79979133605957, -12.305747985839844, -11.811704635620117, -11.317662239074707, -10.82361888885498, -10.32957649230957, -9.835533142089844, -9.341489791870117, -8.847447395324707, -8.35340404510498, -7.859361171722412, -7.365318298339844, -6.871274948120117, -6.377232074737549, -5.8831892013549805, -5.389146327972412, -4.895103454589844, -4.401060104370117, -3.907017230987549, -3.4129743576049805, -2.918931245803833, -2.4248881340026855, -1.9308443069458008, -1.4368013143539429, -0.942758321762085, -0.44871532917022705, 0.04532766342163086, 0.5393705368041992, 1.0334136486053467, 1.5274567604064941, 2.0214996337890625, 2.515542507171631, 3.0095856189727783, 3.503628730773926, 3.997671604156494, 4.4917144775390625, 4.985757827758789, 5.479800701141357, 5.973843574523926, 6.467886447906494, 6.9619293212890625, 7.455972671508789, 7.950015544891357, 8.444058418273926, 8.938101768493652, 9.432144165039062, 9.926187515258789, 10.420230865478516, 10.914273262023926, 11.408316612243652, 11.902359008789062, 12.396402359008789, 12.890445709228516, 13.384489059448242, 13.878531455993652]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 14.0, 21.0, 33.0, 59.0, 131.0, 190.0, 390.0, 813.0, 1660.0, 3683.0, 8827.0, 24073.0, 74142.0, 258599.0, 771657.0, 1431802.0, 1054074.0, 397042.0, 113718.0, 33083.0, 11424.0, 4588.0, 2065.0, 984.0, 502.0, 262.0, 152.0, 90.0, 58.0, 47.0, 30.0, 14.0, 16.0, 13.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9287109375, -1.8536224365234375, -1.778533935546875, -1.7034454345703125, -1.62835693359375, -1.5532684326171875, -1.478179931640625, -1.4030914306640625, -1.3280029296875, -1.2529144287109375, -1.177825927734375, -1.1027374267578125, -1.02764892578125, -0.9525604248046875, -0.877471923828125, -0.8023834228515625, -0.727294921875, -0.6522064208984375, -0.577117919921875, -0.5020294189453125, -0.42694091796875, -0.3518524169921875, -0.276763916015625, -0.2016754150390625, -0.1265869140625, -0.0514984130859375, 0.023590087890625, 0.0986785888671875, 0.17376708984375, 0.2488555908203125, 0.323944091796875, 0.3990325927734375, 0.47412109375, 0.5492095947265625, 0.624298095703125, 0.6993865966796875, 0.77447509765625, 0.8495635986328125, 0.924652099609375, 0.9997406005859375, 1.0748291015625, 1.1499176025390625, 1.225006103515625, 1.3000946044921875, 1.37518310546875, 1.4502716064453125, 1.525360107421875, 1.6004486083984375, 1.675537109375, 1.7506256103515625, 1.825714111328125, 1.9008026123046875, 1.97589111328125, 2.0509796142578125, 2.126068115234375, 2.2011566162109375, 2.2762451171875, 2.3513336181640625, 2.426422119140625, 2.5015106201171875, 2.57659912109375, 2.6516876220703125, 2.726776123046875, 2.8018646240234375, 2.876953125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 12.0, 9.0, 8.0, 7.0, 17.0, 19.0, 17.0, 21.0, 23.0, 28.0, 28.0, 30.0, 26.0, 33.0, 52.0, 41.0, 47.0, 40.0, 42.0, 40.0, 42.0, 49.0, 35.0, 36.0, 37.0, 32.0, 25.0, 22.0, 22.0, 21.0, 21.0, 18.0, 18.0, 14.0, 9.0, 15.0, 8.0, 4.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.865234375, -1.797760009765625, -1.73028564453125, -1.662811279296875, -1.5953369140625, -1.527862548828125, -1.46038818359375, -1.392913818359375, -1.325439453125, -1.257965087890625, -1.19049072265625, -1.123016357421875, -1.0555419921875, -0.988067626953125, -0.92059326171875, -0.853118896484375, -0.78564453125, -0.718170166015625, -0.65069580078125, -0.583221435546875, -0.5157470703125, -0.448272705078125, -0.38079833984375, -0.313323974609375, -0.245849609375, -0.178375244140625, -0.11090087890625, -0.043426513671875, 0.0240478515625, 0.091522216796875, 0.15899658203125, 0.226470947265625, 0.2939453125, 0.361419677734375, 0.42889404296875, 0.496368408203125, 0.5638427734375, 0.631317138671875, 0.69879150390625, 0.766265869140625, 0.833740234375, 0.901214599609375, 0.96868896484375, 1.036163330078125, 1.1036376953125, 1.171112060546875, 1.23858642578125, 1.306060791015625, 1.37353515625, 1.441009521484375, 1.50848388671875, 1.575958251953125, 1.6434326171875, 1.710906982421875, 1.77838134765625, 1.845855712890625, 1.913330078125, 1.980804443359375, 2.04827880859375, 2.115753173828125, 2.1832275390625, 2.250701904296875, 2.31817626953125, 2.385650634765625, 2.453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 9.0, 6.0, 13.0, 13.0, 17.0, 32.0, 45.0, 50.0, 103.0, 135.0, 251.0, 405.0, 722.0, 1261.0, 2353.0, 4648.0, 9595.0, 21962.0, 54348.0, 151200.0, 484775.0, 1564779.0, 1313591.0, 379568.0, 123105.0, 45457.0, 18466.0, 8477.0, 4056.0, 2046.0, 1148.0, 623.0, 327.0, 239.0, 181.0, 108.0, 66.0, 33.0, 19.0, 19.0, 9.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.544921875, -2.46514892578125, -2.3853759765625, -2.30560302734375, -2.225830078125, -2.14605712890625, -2.0662841796875, -1.98651123046875, -1.90673828125, -1.82696533203125, -1.7471923828125, -1.66741943359375, -1.587646484375, -1.50787353515625, -1.4281005859375, -1.34832763671875, -1.2685546875, -1.18878173828125, -1.1090087890625, -1.02923583984375, -0.949462890625, -0.86968994140625, -0.7899169921875, -0.71014404296875, -0.63037109375, -0.55059814453125, -0.4708251953125, -0.39105224609375, -0.311279296875, -0.23150634765625, -0.1517333984375, -0.07196044921875, 0.0078125, 0.08758544921875, 0.1673583984375, 0.24713134765625, 0.326904296875, 0.40667724609375, 0.4864501953125, 0.56622314453125, 0.64599609375, 0.72576904296875, 0.8055419921875, 0.88531494140625, 0.965087890625, 1.04486083984375, 1.1246337890625, 1.20440673828125, 1.2841796875, 1.36395263671875, 1.4437255859375, 1.52349853515625, 1.603271484375, 1.68304443359375, 1.7628173828125, 1.84259033203125, 1.92236328125, 2.00213623046875, 2.0819091796875, 2.16168212890625, 2.241455078125, 2.32122802734375, 2.4010009765625, 2.48077392578125, 2.560546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 8.0, 5.0, 4.0, 11.0, 14.0, 24.0, 18.0, 37.0, 42.0, 58.0, 74.0, 79.0, 120.0, 158.0, 204.0, 268.0, 365.0, 448.0, 439.0, 368.0, 315.0, 254.0, 202.0, 127.0, 105.0, 80.0, 58.0, 46.0, 29.0, 28.0, 23.0, 16.0, 12.0, 8.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.884765625, -3.77752685546875, -3.6702880859375, -3.56304931640625, -3.455810546875, -3.34857177734375, -3.2413330078125, -3.13409423828125, -3.02685546875, -2.91961669921875, -2.8123779296875, -2.70513916015625, -2.597900390625, -2.49066162109375, -2.3834228515625, -2.27618408203125, -2.1689453125, -2.06170654296875, -1.9544677734375, -1.84722900390625, -1.739990234375, -1.63275146484375, -1.5255126953125, -1.41827392578125, -1.31103515625, -1.20379638671875, -1.0965576171875, -0.98931884765625, -0.882080078125, -0.77484130859375, -0.6676025390625, -0.56036376953125, -0.453125, -0.34588623046875, -0.2386474609375, -0.13140869140625, -0.024169921875, 0.08306884765625, 0.1903076171875, 0.29754638671875, 0.40478515625, 0.51202392578125, 0.6192626953125, 0.72650146484375, 0.833740234375, 0.94097900390625, 1.0482177734375, 1.15545654296875, 1.2626953125, 1.36993408203125, 1.4771728515625, 1.58441162109375, 1.691650390625, 1.79888916015625, 1.9061279296875, 2.01336669921875, 2.12060546875, 2.22784423828125, 2.3350830078125, 2.44232177734375, 2.549560546875, 2.65679931640625, 2.7640380859375, 2.87127685546875, 2.978515625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 13.0, 24.0, 88.0, 188.0, 261.0, 229.0, 109.0, 48.0, 21.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.3680419921875, -44.945560455322266, -43.5230827331543, -42.10060119628906, -40.678123474121094, -39.25564193725586, -37.833160400390625, -36.410682678222656, -34.98820114135742, -33.56571960449219, -32.14324188232422, -30.720760345458984, -29.298280715942383, -27.87580108642578, -26.453319549560547, -25.030839920043945, -23.608360290527344, -22.185880661010742, -20.76340103149414, -19.340919494628906, -17.918439865112305, -16.495960235595703, -15.073479652404785, -13.650999069213867, -12.228519439697266, -10.806039810180664, -9.383559226989746, -7.961079120635986, -6.538599014282227, -5.116118907928467, -3.693638801574707, -2.271158218383789, -0.8486747741699219, 0.5738053321838379, 1.9962854385375977, 3.4187655448913574, 4.841245651245117, 6.263725757598877, 7.686205863952637, 9.108686447143555, 10.531166076660156, 11.953645706176758, 13.376126289367676, 14.798606872558594, 16.221086502075195, 17.643566131591797, 19.06604766845703, 20.488527297973633, 21.911006927490234, 23.333486557006836, 24.755966186523438, 26.178447723388672, 27.600927352905273, 29.023406982421875, 30.44588851928711, 31.86836814880371, 33.29084777832031, 34.71332931518555, 36.135807037353516, 37.55828857421875, 38.98076629638672, 40.40324783325195, 41.82572937011719, 43.248207092285156, 44.67068862915039]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 7.0, 10.0, 14.0, 10.0, 10.0, 23.0, 20.0, 23.0, 25.0, 36.0, 37.0, 34.0, 32.0, 47.0, 39.0, 40.0, 50.0, 43.0, 57.0, 52.0, 56.0, 52.0, 37.0, 39.0, 34.0, 32.0, 24.0, 22.0, 18.0, 15.0, 12.0, 12.0, 7.0, 12.0, 3.0, 1.0, 3.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.33450984954834, -12.922429084777832, -12.51034927368164, -12.098268508911133, -11.686187744140625, -11.274106979370117, -10.862027168273926, -10.449946403503418, -10.037866592407227, -9.625785827636719, -9.213706016540527, -8.80162525177002, -8.389544486999512, -7.977464199066162, -7.5653839111328125, -7.153303146362305, -6.741222381591797, -6.329142093658447, -5.9170613288879395, -5.50498104095459, -5.092900276184082, -4.680819988250732, -4.268739700317383, -3.856659173965454, -3.4445786476135254, -3.0324981212615967, -2.620417594909668, -2.2083373069763184, -1.7962567806243896, -1.384176254272461, -0.9720959663391113, -0.5600154399871826, -0.1479339599609375, 0.26414650678634644, 0.6762269735336304, 1.0883073806762695, 1.5003879070281982, 1.912468433380127, 2.3245487213134766, 2.7366292476654053, 3.148709774017334, 3.5607903003692627, 3.9728708267211914, 4.384951114654541, 4.797031402587891, 5.209112167358398, 5.621192455291748, 6.033272743225098, 6.4453535079956055, 6.857433795928955, 7.269514560699463, 7.6815948486328125, 8.09367561340332, 8.505756378173828, 8.91783618927002, 9.329916954040527, 9.741996765136719, 10.154077529907227, 10.566157341003418, 10.978238105773926, 11.390318870544434, 11.802398681640625, 12.214479446411133, 12.62656021118164, 13.038640975952148]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 15.0, 29.0, 38.0, 51.0, 98.0, 137.0, 201.0, 325.0, 557.0, 909.0, 1655.0, 3010.0, 6151.0, 14299.0, 44420.0, 155341.0, 363700.0, 302166.0, 104035.0, 29976.0, 10813.0, 4814.0, 2395.0, 1377.0, 800.0, 483.0, 275.0, 180.0, 100.0, 65.0, 45.0, 31.0, 21.0, 12.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.373260498046875, -3.25628662109375, -3.139312744140625, -3.0223388671875, -2.905364990234375, -2.78839111328125, -2.671417236328125, -2.554443359375, -2.437469482421875, -2.32049560546875, -2.203521728515625, -2.0865478515625, -1.969573974609375, -1.85260009765625, -1.735626220703125, -1.61865234375, -1.501678466796875, -1.38470458984375, -1.267730712890625, -1.1507568359375, -1.033782958984375, -0.91680908203125, -0.799835205078125, -0.682861328125, -0.565887451171875, -0.44891357421875, -0.331939697265625, -0.2149658203125, -0.097991943359375, 0.01898193359375, 0.135955810546875, 0.2529296875, 0.369903564453125, 0.48687744140625, 0.603851318359375, 0.7208251953125, 0.837799072265625, 0.95477294921875, 1.071746826171875, 1.188720703125, 1.305694580078125, 1.42266845703125, 1.539642333984375, 1.6566162109375, 1.773590087890625, 1.89056396484375, 2.007537841796875, 2.12451171875, 2.241485595703125, 2.35845947265625, 2.475433349609375, 2.5924072265625, 2.709381103515625, 2.82635498046875, 2.943328857421875, 3.060302734375, 3.177276611328125, 3.29425048828125, 3.411224365234375, 3.5281982421875, 3.645172119140625, 3.76214599609375, 3.879119873046875, 3.99609375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 10.0, 7.0, 9.0, 8.0, 10.0, 15.0, 19.0, 14.0, 18.0, 25.0, 36.0, 28.0, 27.0, 29.0, 30.0, 45.0, 35.0, 40.0, 43.0, 46.0, 43.0, 50.0, 28.0, 35.0, 45.0, 35.0, 30.0, 22.0, 20.0, 21.0, 30.0, 13.0, 28.0, 13.0, 16.0, 14.0, 13.0, 8.0, 11.0, 5.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.31640625, -2.24871826171875, -2.1810302734375, -2.11334228515625, -2.045654296875, -1.97796630859375, -1.9102783203125, -1.84259033203125, -1.77490234375, -1.70721435546875, -1.6395263671875, -1.57183837890625, -1.504150390625, -1.43646240234375, -1.3687744140625, -1.30108642578125, -1.2333984375, -1.16571044921875, -1.0980224609375, -1.03033447265625, -0.962646484375, -0.89495849609375, -0.8272705078125, -0.75958251953125, -0.69189453125, -0.62420654296875, -0.5565185546875, -0.48883056640625, -0.421142578125, -0.35345458984375, -0.2857666015625, -0.21807861328125, -0.150390625, -0.08270263671875, -0.0150146484375, 0.05267333984375, 0.120361328125, 0.18804931640625, 0.2557373046875, 0.32342529296875, 0.39111328125, 0.45880126953125, 0.5264892578125, 0.59417724609375, 0.661865234375, 0.72955322265625, 0.7972412109375, 0.86492919921875, 0.9326171875, 1.00030517578125, 1.0679931640625, 1.13568115234375, 1.203369140625, 1.27105712890625, 1.3387451171875, 1.40643310546875, 1.47412109375, 1.54180908203125, 1.6094970703125, 1.67718505859375, 1.744873046875, 1.81256103515625, 1.8802490234375, 1.94793701171875, 2.015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 12.0, 20.0, 32.0, 37.0, 66.0, 86.0, 142.0, 201.0, 446.0, 667.0, 1239.0, 2299.0, 4345.0, 8550.0, 18324.0, 45852.0, 125796.0, 282814.0, 308126.0, 151778.0, 55471.0, 21291.0, 10039.0, 4962.0, 2690.0, 1359.0, 776.0, 430.0, 272.0, 168.0, 85.0, 50.0, 40.0, 25.0, 21.0, 11.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.09765625, -3.004058837890625, -2.91046142578125, -2.816864013671875, -2.7232666015625, -2.629669189453125, -2.53607177734375, -2.442474365234375, -2.348876953125, -2.255279541015625, -2.16168212890625, -2.068084716796875, -1.9744873046875, -1.880889892578125, -1.78729248046875, -1.693695068359375, -1.60009765625, -1.506500244140625, -1.41290283203125, -1.319305419921875, -1.2257080078125, -1.132110595703125, -1.03851318359375, -0.944915771484375, -0.851318359375, -0.757720947265625, -0.66412353515625, -0.570526123046875, -0.4769287109375, -0.383331298828125, -0.28973388671875, -0.196136474609375, -0.1025390625, -0.008941650390625, 0.08465576171875, 0.178253173828125, 0.2718505859375, 0.365447998046875, 0.45904541015625, 0.552642822265625, 0.646240234375, 0.739837646484375, 0.83343505859375, 0.927032470703125, 1.0206298828125, 1.114227294921875, 1.20782470703125, 1.301422119140625, 1.39501953125, 1.488616943359375, 1.58221435546875, 1.675811767578125, 1.7694091796875, 1.863006591796875, 1.95660400390625, 2.050201416015625, 2.143798828125, 2.237396240234375, 2.33099365234375, 2.424591064453125, 2.5181884765625, 2.611785888671875, 2.70538330078125, 2.798980712890625, 2.892578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 14.0, 6.0, 10.0, 10.0, 20.0, 18.0, 26.0, 36.0, 33.0, 44.0, 55.0, 50.0, 45.0, 68.0, 65.0, 56.0, 57.0, 54.0, 61.0, 53.0, 38.0, 38.0, 23.0, 24.0, 27.0, 18.0, 19.0, 16.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.5078125, -10.23016357421875, -9.9525146484375, -9.67486572265625, -9.397216796875, -9.11956787109375, -8.8419189453125, -8.56427001953125, -8.28662109375, -8.00897216796875, -7.7313232421875, -7.45367431640625, -7.176025390625, -6.89837646484375, -6.6207275390625, -6.34307861328125, -6.0654296875, -5.78778076171875, -5.5101318359375, -5.23248291015625, -4.954833984375, -4.67718505859375, -4.3995361328125, -4.12188720703125, -3.84423828125, -3.56658935546875, -3.2889404296875, -3.01129150390625, -2.733642578125, -2.45599365234375, -2.1783447265625, -1.90069580078125, -1.623046875, -1.34539794921875, -1.0677490234375, -0.79010009765625, -0.512451171875, -0.23480224609375, 0.0428466796875, 0.32049560546875, 0.59814453125, 0.87579345703125, 1.1534423828125, 1.43109130859375, 1.708740234375, 1.98638916015625, 2.2640380859375, 2.54168701171875, 2.8193359375, 3.09698486328125, 3.3746337890625, 3.65228271484375, 3.929931640625, 4.20758056640625, 4.4852294921875, 4.76287841796875, 5.04052734375, 5.31817626953125, 5.5958251953125, 5.87347412109375, 6.151123046875, 6.42877197265625, 6.7064208984375, 6.98406982421875, 7.26171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 16.0, 17.0, 37.0, 33.0, 54.0, 87.0, 119.0, 175.0, 250.0, 427.0, 555.0, 856.0, 1279.0, 2171.0, 3318.0, 5392.0, 8738.0, 14481.0, 24041.0, 39770.0, 66124.0, 106717.0, 154195.0, 180168.0, 157073.0, 109251.0, 68264.0, 40839.0, 24790.0, 14823.0, 9247.0, 5498.0, 3453.0, 2183.0, 1378.0, 902.0, 605.0, 385.0, 248.0, 176.0, 123.0, 69.0, 72.0, 45.0, 31.0, 22.0, 9.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.5400390625, -0.5234375, -0.5068359375, -0.490234375, -0.4736328125, -0.45703125, -0.4404296875, -0.423828125, -0.4072265625, -0.390625, -0.3740234375, -0.357421875, -0.3408203125, -0.32421875, -0.3076171875, -0.291015625, -0.2744140625, -0.2578125, -0.2412109375, -0.224609375, -0.2080078125, -0.19140625, -0.1748046875, -0.158203125, -0.1416015625, -0.125, -0.1083984375, -0.091796875, -0.0751953125, -0.05859375, -0.0419921875, -0.025390625, -0.0087890625, 0.0078125, 0.0244140625, 0.041015625, 0.0576171875, 0.07421875, 0.0908203125, 0.107421875, 0.1240234375, 0.140625, 0.1572265625, 0.173828125, 0.1904296875, 0.20703125, 0.2236328125, 0.240234375, 0.2568359375, 0.2734375, 0.2900390625, 0.306640625, 0.3232421875, 0.33984375, 0.3564453125, 0.373046875, 0.3896484375, 0.40625, 0.4228515625, 0.439453125, 0.4560546875, 0.47265625, 0.4892578125, 0.505859375, 0.5224609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 7.0, 5.0, 5.0, 12.0, 17.0, 10.0, 20.0, 36.0, 31.0, 54.0, 73.0, 91.0, 113.0, 123.0, 109.0, 79.0, 63.0, 35.0, 32.0, 18.0, 11.0, 18.0, 10.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004665851593017578, -0.00045154616236686707, -0.0004365071654319763, -0.00042146816849708557, -0.0004064291715621948, -0.0003913901746273041, -0.00037635117769241333, -0.0003613121807575226, -0.00034627318382263184, -0.0003312341868877411, -0.00031619518995285034, -0.0003011561930179596, -0.00028611719608306885, -0.0002710781991481781, -0.00025603920221328735, -0.0002410002052783966, -0.00022596120834350586, -0.0002109222114086151, -0.00019588321447372437, -0.00018084421753883362, -0.00016580522060394287, -0.00015076622366905212, -0.00013572722673416138, -0.00012068822979927063, -0.00010564923286437988, -9.061023592948914e-05, -7.557123899459839e-05, -6.053224205970764e-05, -4.5493245124816895e-05, -3.0454248189926147e-05, -1.54152512550354e-05, -3.762543201446533e-07, 1.4662742614746094e-05, 2.970173954963684e-05, 4.474073648452759e-05, 5.9779733419418335e-05, 7.481873035430908e-05, 8.985772728919983e-05, 0.00010489672422409058, 0.00011993572115898132, 0.00013497471809387207, 0.00015001371502876282, 0.00016505271196365356, 0.0001800917088985443, 0.00019513070583343506, 0.0002101697027683258, 0.00022520869970321655, 0.0002402476966381073, 0.00025528669357299805, 0.0002703256905078888, 0.00028536468744277954, 0.0003004036843776703, 0.00031544268131256104, 0.0003304816782474518, 0.00034552067518234253, 0.0003605596721172333, 0.000375598669052124, 0.00039063766598701477, 0.0004056766629219055, 0.00042071565985679626, 0.000435754656791687, 0.00045079365372657776, 0.0004658326506614685, 0.00048087164759635925, 0.00049591064453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 9.0, 19.0, 24.0, 52.0, 74.0, 124.0, 200.0, 343.0, 543.0, 999.0, 1878.0, 3567.0, 6981.0, 13505.0, 26917.0, 53218.0, 99926.0, 167074.0, 215270.0, 191529.0, 124917.0, 68872.0, 35486.0, 17753.0, 9048.0, 4675.0, 2491.0, 1295.0, 734.0, 409.0, 225.0, 145.0, 70.0, 40.0, 39.0, 29.0, 19.0, 16.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.7158203125, -0.6951904296875, -0.674560546875, -0.6539306640625, -0.63330078125, -0.6126708984375, -0.592041015625, -0.5714111328125, -0.55078125, -0.5301513671875, -0.509521484375, -0.4888916015625, -0.46826171875, -0.4476318359375, -0.427001953125, -0.4063720703125, -0.3857421875, -0.3651123046875, -0.344482421875, -0.3238525390625, -0.30322265625, -0.2825927734375, -0.261962890625, -0.2413330078125, -0.220703125, -0.2000732421875, -0.179443359375, -0.1588134765625, -0.13818359375, -0.1175537109375, -0.096923828125, -0.0762939453125, -0.0556640625, -0.0350341796875, -0.014404296875, 0.0062255859375, 0.02685546875, 0.0474853515625, 0.068115234375, 0.0887451171875, 0.109375, 0.1300048828125, 0.150634765625, 0.1712646484375, 0.19189453125, 0.2125244140625, 0.233154296875, 0.2537841796875, 0.2744140625, 0.2950439453125, 0.315673828125, 0.3363037109375, 0.35693359375, 0.3775634765625, 0.398193359375, 0.4188232421875, 0.439453125, 0.4600830078125, 0.480712890625, 0.5013427734375, 0.52197265625, 0.5426025390625, 0.563232421875, 0.5838623046875, 0.6044921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 7.0, 6.0, 9.0, 9.0, 14.0, 21.0, 12.0, 22.0, 24.0, 22.0, 28.0, 40.0, 46.0, 43.0, 39.0, 40.0, 68.0, 58.0, 40.0, 40.0, 48.0, 41.0, 52.0, 49.0, 38.0, 29.0, 28.0, 27.0, 11.0, 15.0, 9.0, 9.0, 8.0, 14.0, 9.0, 7.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.92822265625, -0.9015960693359375, -0.874969482421875, -0.8483428955078125, -0.82171630859375, -0.7950897216796875, -0.768463134765625, -0.7418365478515625, -0.7152099609375, -0.6885833740234375, -0.661956787109375, -0.6353302001953125, -0.60870361328125, -0.5820770263671875, -0.555450439453125, -0.5288238525390625, -0.502197265625, -0.4755706787109375, -0.448944091796875, -0.4223175048828125, -0.39569091796875, -0.3690643310546875, -0.342437744140625, -0.3158111572265625, -0.2891845703125, -0.2625579833984375, -0.235931396484375, -0.2093048095703125, -0.18267822265625, -0.1560516357421875, -0.129425048828125, -0.1027984619140625, -0.076171875, -0.0495452880859375, -0.022918701171875, 0.0037078857421875, 0.03033447265625, 0.0569610595703125, 0.083587646484375, 0.1102142333984375, 0.1368408203125, 0.1634674072265625, 0.190093994140625, 0.2167205810546875, 0.24334716796875, 0.2699737548828125, 0.296600341796875, 0.3232269287109375, 0.349853515625, 0.3764801025390625, 0.403106689453125, 0.4297332763671875, 0.45635986328125, 0.4829864501953125, 0.509613037109375, 0.5362396240234375, 0.5628662109375, 0.5894927978515625, 0.616119384765625, 0.6427459716796875, 0.66937255859375, 0.6959991455078125, 0.722625732421875, 0.7492523193359375, 0.77587890625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 12.0, 4.0, 17.0, 30.0, 38.0, 65.0, 116.0, 142.0, 163.0, 138.0, 105.0, 69.0, 30.0, 23.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-24.56344985961914, -23.81045913696289, -23.05746841430664, -22.30447769165039, -21.55148696899414, -20.798498153686523, -20.045507431030273, -19.292516708374023, -18.539525985717773, -17.786535263061523, -17.033544540405273, -16.280553817749023, -15.52756404876709, -14.77457332611084, -14.021583557128906, -13.268592834472656, -12.515602111816406, -11.762611389160156, -11.009620666503906, -10.256630897521973, -9.503640174865723, -8.750649452209473, -7.997659206390381, -7.244668960571289, -6.491678237915039, -5.738687515258789, -4.985697269439697, -4.2327070236206055, -3.4797163009643555, -2.7267258167266846, -1.9737353324890137, -1.2207450866699219, -0.46775245666503906, 0.28523802757263184, 1.0382285118103027, 1.7912189960479736, 2.5442094802856445, 3.2971999645233154, 4.050190448760986, 4.803180694580078, 5.556171417236328, 6.309162139892578, 7.06215238571167, 7.815142631530762, 8.568133354187012, 9.321124076843262, 10.074113845825195, 10.827104568481445, 11.580095291137695, 12.333086013793945, 13.086076736450195, 13.839066505432129, 14.592057228088379, 15.345047950744629, 16.098037719726562, 16.851028442382812, 17.604019165039062, 18.357009887695312, 19.110000610351562, 19.862991333007812, 20.615982055664062, 21.36897087097168, 22.12196159362793, 22.87495231628418, 23.62794303894043]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 9.0, 13.0, 18.0, 13.0, 13.0, 23.0, 21.0, 19.0, 26.0, 30.0, 39.0, 35.0, 44.0, 34.0, 45.0, 37.0, 38.0, 35.0, 38.0, 44.0, 43.0, 32.0, 36.0, 26.0, 35.0, 27.0, 33.0, 23.0, 23.0, 18.0, 17.0, 15.0, 14.0, 16.0, 8.0, 8.0, 14.0, 6.0, 4.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.432417869567871, -10.983609199523926, -10.534799575805664, -10.085990905761719, -9.637182235717773, -9.188373565673828, -8.739563941955566, -8.290755271911621, -7.841946125030518, -7.393136978149414, -6.944328308105469, -6.495519161224365, -6.046710014343262, -5.597901344299316, -5.149092197418213, -4.700283050537109, -4.251474380493164, -3.8026654720306396, -3.3538565635681152, -2.9050474166870117, -2.4562385082244873, -2.007429599761963, -1.5586204528808594, -1.109811544418335, -0.6610026359558105, -0.21219366788864136, 0.23661530017852783, 0.6854243278503418, 1.1342332363128662, 1.5830421447753906, 2.031851291656494, 2.4806602001190186, 2.9294700622558594, 3.378278970718384, 3.827087879180908, 4.275897026062012, 4.724705696105957, 5.1735148429870605, 5.622323989868164, 6.071132659912109, 6.519941806793213, 6.968750953674316, 7.417559623718262, 7.866368770599365, 8.315177917480469, 8.763986587524414, 9.21279525756836, 9.661604881286621, 10.110413551330566, 10.559222221374512, 11.008031845092773, 11.456840515136719, 11.905649185180664, 12.35445785522461, 12.803267478942871, 13.252076148986816, 13.700885772705078, 14.149694442749023, 14.598504066467285, 15.04731273651123, 15.496121406555176, 15.944931030273438, 16.393739700317383, 16.842548370361328, 17.291357040405273]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 15.0, 17.0, 49.0, 60.0, 75.0, 179.0, 246.0, 477.0, 912.0, 1983.0, 4265.0, 10179.0, 27170.0, 85078.0, 302368.0, 923855.0, 1538689.0, 899975.0, 281929.0, 75787.0, 24166.0, 9148.0, 3909.0, 1766.0, 856.0, 476.0, 282.0, 150.0, 77.0, 53.0, 25.0, 28.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.98455810546875, -1.9066162109375, -1.82867431640625, -1.750732421875, -1.67279052734375, -1.5948486328125, -1.51690673828125, -1.43896484375, -1.36102294921875, -1.2830810546875, -1.20513916015625, -1.127197265625, -1.04925537109375, -0.9713134765625, -0.89337158203125, -0.8154296875, -0.73748779296875, -0.6595458984375, -0.58160400390625, -0.503662109375, -0.42572021484375, -0.3477783203125, -0.26983642578125, -0.19189453125, -0.11395263671875, -0.0360107421875, 0.04193115234375, 0.119873046875, 0.19781494140625, 0.2757568359375, 0.35369873046875, 0.431640625, 0.50958251953125, 0.5875244140625, 0.66546630859375, 0.743408203125, 0.82135009765625, 0.8992919921875, 0.97723388671875, 1.05517578125, 1.13311767578125, 1.2110595703125, 1.28900146484375, 1.366943359375, 1.44488525390625, 1.5228271484375, 1.60076904296875, 1.6787109375, 1.75665283203125, 1.8345947265625, 1.91253662109375, 1.990478515625, 2.06842041015625, 2.1463623046875, 2.22430419921875, 2.30224609375, 2.38018798828125, 2.4581298828125, 2.53607177734375, 2.614013671875, 2.69195556640625, 2.7698974609375, 2.84783935546875, 2.92578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 10.0, 17.0, 8.0, 11.0, 22.0, 23.0, 14.0, 30.0, 33.0, 31.0, 37.0, 36.0, 32.0, 36.0, 38.0, 43.0, 40.0, 36.0, 42.0, 40.0, 39.0, 39.0, 45.0, 36.0, 37.0, 30.0, 26.0, 19.0, 12.0, 21.0, 24.0, 18.0, 13.0, 9.0, 15.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.81640625, -1.75372314453125, -1.6910400390625, -1.62835693359375, -1.565673828125, -1.50299072265625, -1.4403076171875, -1.37762451171875, -1.31494140625, -1.25225830078125, -1.1895751953125, -1.12689208984375, -1.064208984375, -1.00152587890625, -0.9388427734375, -0.87615966796875, -0.8134765625, -0.75079345703125, -0.6881103515625, -0.62542724609375, -0.562744140625, -0.50006103515625, -0.4373779296875, -0.37469482421875, -0.31201171875, -0.24932861328125, -0.1866455078125, -0.12396240234375, -0.061279296875, 0.00140380859375, 0.0640869140625, 0.12677001953125, 0.189453125, 0.25213623046875, 0.3148193359375, 0.37750244140625, 0.440185546875, 0.50286865234375, 0.5655517578125, 0.62823486328125, 0.69091796875, 0.75360107421875, 0.8162841796875, 0.87896728515625, 0.941650390625, 1.00433349609375, 1.0670166015625, 1.12969970703125, 1.1923828125, 1.25506591796875, 1.3177490234375, 1.38043212890625, 1.443115234375, 1.50579833984375, 1.5684814453125, 1.63116455078125, 1.69384765625, 1.75653076171875, 1.8192138671875, 1.88189697265625, 1.944580078125, 2.00726318359375, 2.0699462890625, 2.13262939453125, 2.1953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 9.0, 9.0, 20.0, 24.0, 35.0, 57.0, 115.0, 210.0, 389.0, 820.0, 1758.0, 4138.0, 11838.0, 38225.0, 154735.0, 917048.0, 2420646.0, 505622.0, 98044.0, 26110.0, 8517.0, 3244.0, 1328.0, 648.0, 265.0, 170.0, 86.0, 68.0, 32.0, 21.0, 15.0, 14.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.499481201171875, -2.38763427734375, -2.275787353515625, -2.1639404296875, -2.052093505859375, -1.94024658203125, -1.828399658203125, -1.716552734375, -1.604705810546875, -1.49285888671875, -1.381011962890625, -1.2691650390625, -1.157318115234375, -1.04547119140625, -0.933624267578125, -0.82177734375, -0.709930419921875, -0.59808349609375, -0.486236572265625, -0.3743896484375, -0.262542724609375, -0.15069580078125, -0.038848876953125, 0.072998046875, 0.184844970703125, 0.29669189453125, 0.408538818359375, 0.5203857421875, 0.632232666015625, 0.74407958984375, 0.855926513671875, 0.9677734375, 1.079620361328125, 1.19146728515625, 1.303314208984375, 1.4151611328125, 1.527008056640625, 1.63885498046875, 1.750701904296875, 1.862548828125, 1.974395751953125, 2.08624267578125, 2.198089599609375, 2.3099365234375, 2.421783447265625, 2.53363037109375, 2.645477294921875, 2.75732421875, 2.869171142578125, 2.98101806640625, 3.092864990234375, 3.2047119140625, 3.316558837890625, 3.42840576171875, 3.540252685546875, 3.652099609375, 3.763946533203125, 3.87579345703125, 3.987640380859375, 4.0994873046875, 4.211334228515625, 4.32318115234375, 4.435028076171875, 4.546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 10.0, 24.0, 14.0, 39.0, 51.0, 91.0, 114.0, 177.0, 295.0, 485.0, 692.0, 693.0, 519.0, 323.0, 182.0, 111.0, 83.0, 52.0, 41.0, 29.0, 20.0, 13.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96875, -5.8076171875, -5.646484375, -5.4853515625, -5.32421875, -5.1630859375, -5.001953125, -4.8408203125, -4.6796875, -4.5185546875, -4.357421875, -4.1962890625, -4.03515625, -3.8740234375, -3.712890625, -3.5517578125, -3.390625, -3.2294921875, -3.068359375, -2.9072265625, -2.74609375, -2.5849609375, -2.423828125, -2.2626953125, -2.1015625, -1.9404296875, -1.779296875, -1.6181640625, -1.45703125, -1.2958984375, -1.134765625, -0.9736328125, -0.8125, -0.6513671875, -0.490234375, -0.3291015625, -0.16796875, -0.0068359375, 0.154296875, 0.3154296875, 0.4765625, 0.6376953125, 0.798828125, 0.9599609375, 1.12109375, 1.2822265625, 1.443359375, 1.6044921875, 1.765625, 1.9267578125, 2.087890625, 2.2490234375, 2.41015625, 2.5712890625, 2.732421875, 2.8935546875, 3.0546875, 3.2158203125, 3.376953125, 3.5380859375, 3.69921875, 3.8603515625, 4.021484375, 4.1826171875, 4.34375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 11.0, 14.0, 37.0, 111.0, 184.0, 224.0, 200.0, 117.0, 52.0, 26.0, 12.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.118736267089844, -50.80192565917969, -49.48511505126953, -48.16830825805664, -46.851497650146484, -45.53468704223633, -44.21787643432617, -42.901065826416016, -41.584259033203125, -40.26744842529297, -38.95063781738281, -37.63383102416992, -36.317020416259766, -35.00020980834961, -33.68339920043945, -32.3665885925293, -31.04977798461914, -29.732967376708984, -28.41615867614746, -27.099348068237305, -25.78253936767578, -24.465728759765625, -23.14891815185547, -21.832107543945312, -20.51529884338379, -19.198488235473633, -17.88167953491211, -16.564868927001953, -15.248059272766113, -13.931249618530273, -12.614439010620117, -11.297629356384277, -9.980815887451172, -8.664006233215332, -7.347196102142334, -6.030385971069336, -4.713576316833496, -3.3967666625976562, -2.079956531524658, -0.7631464004516602, 0.5536632537841797, 1.8704731464385986, 3.1872830390930176, 4.504093170166016, 5.8209028244018555, 7.137712478637695, 8.454523086547852, 9.771332740783691, 11.088142395019531, 12.404952049255371, 13.721761703491211, 15.038572311401367, 16.35538101196289, 17.672191619873047, 18.989002227783203, 20.30581283569336, 21.622621536254883, 22.93943214416504, 24.256240844726562, 25.57305145263672, 26.889862060546875, 28.2066707611084, 29.523481369018555, 30.840290069580078, 32.157100677490234]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 10.0, 8.0, 9.0, 5.0, 9.0, 16.0, 16.0, 19.0, 25.0, 23.0, 19.0, 21.0, 33.0, 34.0, 26.0, 42.0, 28.0, 43.0, 46.0, 37.0, 36.0, 43.0, 34.0, 48.0, 36.0, 34.0, 28.0, 25.0, 30.0, 27.0, 15.0, 20.0, 16.0, 29.0, 13.0, 12.0, 11.0, 12.0, 11.0, 12.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.721087455749512, -9.388763427734375, -9.056439399719238, -8.724115371704102, -8.391791343688965, -8.059467315673828, -7.727143287658691, -7.394819259643555, -7.062495231628418, -6.730171203613281, -6.3978471755981445, -6.065523147583008, -5.733199119567871, -5.400875091552734, -5.068551063537598, -4.736227035522461, -4.403903007507324, -4.0715789794921875, -3.739254951477051, -3.406930923461914, -3.0746068954467773, -2.7422828674316406, -2.409958839416504, -2.077634811401367, -1.7453107833862305, -1.4129867553710938, -1.080662727355957, -0.7483386993408203, -0.4160146713256836, -0.08369064331054688, 0.24863338470458984, 0.5809574127197266, 0.9132823944091797, 1.2456064224243164, 1.5779304504394531, 1.9102544784545898, 2.2425785064697266, 2.5749025344848633, 2.9072265625, 3.2395505905151367, 3.5718746185302734, 3.90419864654541, 4.236522674560547, 4.568846702575684, 4.90117073059082, 5.233494758605957, 5.565818786621094, 5.8981428146362305, 6.230466842651367, 6.562790870666504, 6.895114898681641, 7.227438926696777, 7.559762954711914, 7.892086982727051, 8.224411010742188, 8.556735038757324, 8.889059066772461, 9.221383094787598, 9.553707122802734, 9.886031150817871, 10.218355178833008, 10.550679206848145, 10.883003234863281, 11.215327262878418, 11.547651290893555]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 14.0, 17.0, 19.0, 26.0, 35.0, 71.0, 90.0, 158.0, 227.0, 392.0, 627.0, 1018.0, 1719.0, 3138.0, 5530.0, 9809.0, 17835.0, 32235.0, 56536.0, 94467.0, 142666.0, 179776.0, 173785.0, 131081.0, 84438.0, 49586.0, 28143.0, 15174.0, 8393.0, 4755.0, 2822.0, 1544.0, 908.0, 562.0, 317.0, 237.0, 147.0, 78.0, 57.0, 43.0, 26.0, 17.0, 16.0, 9.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.6982421875, -1.6481170654296875, -1.597991943359375, -1.5478668212890625, -1.49774169921875, -1.4476165771484375, -1.397491455078125, -1.3473663330078125, -1.2972412109375, -1.2471160888671875, -1.196990966796875, -1.1468658447265625, -1.09674072265625, -1.0466156005859375, -0.996490478515625, -0.9463653564453125, -0.896240234375, -0.8461151123046875, -0.795989990234375, -0.7458648681640625, -0.69573974609375, -0.6456146240234375, -0.595489501953125, -0.5453643798828125, -0.4952392578125, -0.4451141357421875, -0.394989013671875, -0.3448638916015625, -0.29473876953125, -0.2446136474609375, -0.194488525390625, -0.1443634033203125, -0.09423828125, -0.0441131591796875, 0.006011962890625, 0.0561370849609375, 0.10626220703125, 0.1563873291015625, 0.206512451171875, 0.2566375732421875, 0.3067626953125, 0.3568878173828125, 0.407012939453125, 0.4571380615234375, 0.50726318359375, 0.5573883056640625, 0.607513427734375, 0.6576385498046875, 0.707763671875, 0.7578887939453125, 0.808013916015625, 0.8581390380859375, 0.90826416015625, 0.9583892822265625, 1.008514404296875, 1.0586395263671875, 1.1087646484375, 1.1588897705078125, 1.209014892578125, 1.2591400146484375, 1.30926513671875, 1.3593902587890625, 1.409515380859375, 1.4596405029296875, 1.509765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 9.0, 6.0, 9.0, 13.0, 16.0, 12.0, 11.0, 37.0, 34.0, 33.0, 44.0, 46.0, 37.0, 38.0, 54.0, 44.0, 46.0, 60.0, 42.0, 45.0, 37.0, 51.0, 33.0, 45.0, 30.0, 28.0, 26.0, 16.0, 24.0, 25.0, 8.0, 10.0, 11.0, 4.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.4298095703125, -2.345947265625, -2.2620849609375, -2.17822265625, -2.0943603515625, -2.010498046875, -1.9266357421875, -1.8427734375, -1.7589111328125, -1.675048828125, -1.5911865234375, -1.50732421875, -1.4234619140625, -1.339599609375, -1.2557373046875, -1.171875, -1.0880126953125, -1.004150390625, -0.9202880859375, -0.83642578125, -0.7525634765625, -0.668701171875, -0.5848388671875, -0.5009765625, -0.4171142578125, -0.333251953125, -0.2493896484375, -0.16552734375, -0.0816650390625, 0.002197265625, 0.0860595703125, 0.169921875, 0.2537841796875, 0.337646484375, 0.4215087890625, 0.50537109375, 0.5892333984375, 0.673095703125, 0.7569580078125, 0.8408203125, 0.9246826171875, 1.008544921875, 1.0924072265625, 1.17626953125, 1.2601318359375, 1.343994140625, 1.4278564453125, 1.51171875, 1.5955810546875, 1.679443359375, 1.7633056640625, 1.84716796875, 1.9310302734375, 2.014892578125, 2.0987548828125, 2.1826171875, 2.2664794921875, 2.350341796875, 2.4342041015625, 2.51806640625, 2.6019287109375, 2.685791015625, 2.7696533203125, 2.853515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 9.0, 21.0, 28.0, 35.0, 69.0, 87.0, 174.0, 292.0, 391.0, 779.0, 1372.0, 2581.0, 5082.0, 10533.0, 22475.0, 48468.0, 103472.0, 197783.0, 287824.0, 186216.0, 95276.0, 44730.0, 20447.0, 9808.0, 4865.0, 2445.0, 1381.0, 719.0, 436.0, 281.0, 178.0, 106.0, 59.0, 37.0, 23.0, 22.0, 4.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.236328125, -2.169464111328125, -2.10260009765625, -2.035736083984375, -1.9688720703125, -1.902008056640625, -1.83514404296875, -1.768280029296875, -1.701416015625, -1.634552001953125, -1.56768798828125, -1.500823974609375, -1.4339599609375, -1.367095947265625, -1.30023193359375, -1.233367919921875, -1.16650390625, -1.099639892578125, -1.03277587890625, -0.965911865234375, -0.8990478515625, -0.832183837890625, -0.76531982421875, -0.698455810546875, -0.631591796875, -0.564727783203125, -0.49786376953125, -0.430999755859375, -0.3641357421875, -0.297271728515625, -0.23040771484375, -0.163543701171875, -0.0966796875, -0.029815673828125, 0.03704833984375, 0.103912353515625, 0.1707763671875, 0.237640380859375, 0.30450439453125, 0.371368408203125, 0.438232421875, 0.505096435546875, 0.57196044921875, 0.638824462890625, 0.7056884765625, 0.772552490234375, 0.83941650390625, 0.906280517578125, 0.97314453125, 1.040008544921875, 1.10687255859375, 1.173736572265625, 1.2406005859375, 1.307464599609375, 1.37432861328125, 1.441192626953125, 1.508056640625, 1.574920654296875, 1.64178466796875, 1.708648681640625, 1.7755126953125, 1.842376708984375, 1.90924072265625, 1.976104736328125, 2.04296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 11.0, 17.0, 26.0, 14.0, 15.0, 22.0, 25.0, 30.0, 33.0, 33.0, 50.0, 38.0, 42.0, 39.0, 49.0, 38.0, 36.0, 43.0, 40.0, 46.0, 42.0, 48.0, 35.0, 30.0, 29.0, 20.0, 19.0, 14.0, 17.0, 19.0, 15.0, 10.0, 7.0, 2.0, 4.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.9453125, -5.7509765625, -5.556640625, -5.3623046875, -5.16796875, -4.9736328125, -4.779296875, -4.5849609375, -4.390625, -4.1962890625, -4.001953125, -3.8076171875, -3.61328125, -3.4189453125, -3.224609375, -3.0302734375, -2.8359375, -2.6416015625, -2.447265625, -2.2529296875, -2.05859375, -1.8642578125, -1.669921875, -1.4755859375, -1.28125, -1.0869140625, -0.892578125, -0.6982421875, -0.50390625, -0.3095703125, -0.115234375, 0.0791015625, 0.2734375, 0.4677734375, 0.662109375, 0.8564453125, 1.05078125, 1.2451171875, 1.439453125, 1.6337890625, 1.828125, 2.0224609375, 2.216796875, 2.4111328125, 2.60546875, 2.7998046875, 2.994140625, 3.1884765625, 3.3828125, 3.5771484375, 3.771484375, 3.9658203125, 4.16015625, 4.3544921875, 4.548828125, 4.7431640625, 4.9375, 5.1318359375, 5.326171875, 5.5205078125, 5.71484375, 5.9091796875, 6.103515625, 6.2978515625, 6.4921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 10.0, 10.0, 12.0, 21.0, 31.0, 49.0, 71.0, 105.0, 157.0, 262.0, 406.0, 741.0, 1364.0, 2185.0, 4118.0, 7388.0, 13546.0, 25270.0, 46254.0, 81642.0, 136890.0, 225735.0, 199118.0, 130203.0, 77388.0, 43479.0, 23528.0, 12728.0, 6727.0, 3880.0, 2082.0, 1264.0, 724.0, 441.0, 267.0, 170.0, 98.0, 55.0, 37.0, 22.0, 22.0, 8.0, 14.0, 5.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.395263671875, -0.3824920654296875, -0.369720458984375, -0.3569488525390625, -0.34417724609375, -0.3314056396484375, -0.318634033203125, -0.3058624267578125, -0.2930908203125, -0.2803192138671875, -0.267547607421875, -0.2547760009765625, -0.24200439453125, -0.2292327880859375, -0.216461181640625, -0.2036895751953125, -0.19091796875, -0.1781463623046875, -0.165374755859375, -0.1526031494140625, -0.13983154296875, -0.1270599365234375, -0.114288330078125, -0.1015167236328125, -0.0887451171875, -0.0759735107421875, -0.063201904296875, -0.0504302978515625, -0.03765869140625, -0.0248870849609375, -0.012115478515625, 0.0006561279296875, 0.013427734375, 0.0261993408203125, 0.038970947265625, 0.0517425537109375, 0.06451416015625, 0.0772857666015625, 0.090057373046875, 0.1028289794921875, 0.1156005859375, 0.1283721923828125, 0.141143798828125, 0.1539154052734375, 0.16668701171875, 0.1794586181640625, 0.192230224609375, 0.2050018310546875, 0.2177734375, 0.2305450439453125, 0.243316650390625, 0.2560882568359375, 0.26885986328125, 0.2816314697265625, 0.294403076171875, 0.3071746826171875, 0.3199462890625, 0.3327178955078125, 0.345489501953125, 0.3582611083984375, 0.37103271484375, 0.3838043212890625, 0.396575927734375, 0.4093475341796875, 0.422119140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 3.0, 6.0, 15.0, 19.0, 18.0, 25.0, 35.0, 35.0, 39.0, 34.0, 38.0, 64.0, 52.0, 74.0, 62.0, 67.0, 52.0, 60.0, 50.0, 47.0, 23.0, 30.0, 24.0, 19.0, 18.0, 21.0, 6.0, 9.0, 7.0, 8.0, 5.0, 2.0, 2.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002390146255493164, -0.00023225508630275726, -0.00022549554705619812, -0.00021873600780963898, -0.00021197646856307983, -0.0002052169293165207, -0.00019845739006996155, -0.0001916978508234024, -0.00018493831157684326, -0.00017817877233028412, -0.00017141923308372498, -0.00016465969383716583, -0.0001579001545906067, -0.00015114061534404755, -0.0001443810760974884, -0.00013762153685092926, -0.00013086199760437012, -0.00012410245835781097, -0.00011734291911125183, -0.00011058337986469269, -0.00010382384061813354, -9.70643013715744e-05, -9.030476212501526e-05, -8.354522287845612e-05, -7.678568363189697e-05, -7.002614438533783e-05, -6.326660513877869e-05, -5.6507065892219543e-05, -4.97475266456604e-05, -4.298798739910126e-05, -3.6228448152542114e-05, -2.946890890598297e-05, -2.2709369659423828e-05, -1.5949830412864685e-05, -9.190291166305542e-06, -2.430751919746399e-06, 4.328787326812744e-06, 1.1088326573371887e-05, 1.784786581993103e-05, 2.4607405066490173e-05, 3.1366944313049316e-05, 3.812648355960846e-05, 4.48860228061676e-05, 5.1645562052726746e-05, 5.840510129928589e-05, 6.516464054584503e-05, 7.192417979240417e-05, 7.868371903896332e-05, 8.544325828552246e-05, 9.22027975320816e-05, 9.896233677864075e-05, 0.00010572187602519989, 0.00011248141527175903, 0.00011924095451831818, 0.00012600049376487732, 0.00013276003301143646, 0.0001395195722579956, 0.00014627911150455475, 0.0001530386507511139, 0.00015979818999767303, 0.00016655772924423218, 0.00017331726849079132, 0.00018007680773735046, 0.0001868363469839096, 0.00019359588623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 9.0, 17.0, 20.0, 33.0, 64.0, 119.0, 218.0, 364.0, 753.0, 1404.0, 2765.0, 5753.0, 11500.0, 23738.0, 46743.0, 88468.0, 152532.0, 246640.0, 199260.0, 125629.0, 70355.0, 36279.0, 18263.0, 8822.0, 4355.0, 2136.0, 1049.0, 550.0, 312.0, 161.0, 91.0, 64.0, 30.0, 21.0, 10.0, 6.0, 8.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.55859375, -0.5434188842773438, -0.5282440185546875, -0.5130691528320312, -0.497894287109375, -0.48271942138671875, -0.4675445556640625, -0.45236968994140625, -0.43719482421875, -0.42201995849609375, -0.4068450927734375, -0.39167022705078125, -0.376495361328125, -0.36132049560546875, -0.3461456298828125, -0.33097076416015625, -0.3157958984375, -0.30062103271484375, -0.2854461669921875, -0.27027130126953125, -0.255096435546875, -0.23992156982421875, -0.2247467041015625, -0.20957183837890625, -0.19439697265625, -0.17922210693359375, -0.1640472412109375, -0.14887237548828125, -0.133697509765625, -0.11852264404296875, -0.1033477783203125, -0.08817291259765625, -0.072998046875, -0.05782318115234375, -0.0426483154296875, -0.02747344970703125, -0.012298583984375, 0.00287628173828125, 0.0180511474609375, 0.03322601318359375, 0.04840087890625, 0.06357574462890625, 0.0787506103515625, 0.09392547607421875, 0.109100341796875, 0.12427520751953125, 0.1394500732421875, 0.15462493896484375, 0.1697998046875, 0.18497467041015625, 0.2001495361328125, 0.21532440185546875, 0.230499267578125, 0.24567413330078125, 0.2608489990234375, 0.27602386474609375, 0.29119873046875, 0.30637359619140625, 0.3215484619140625, 0.33672332763671875, 0.351898193359375, 0.36707305908203125, 0.3822479248046875, 0.39742279052734375, 0.41259765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 4.0, 3.0, 7.0, 14.0, 9.0, 10.0, 20.0, 18.0, 18.0, 22.0, 35.0, 32.0, 34.0, 26.0, 45.0, 48.0, 48.0, 47.0, 50.0, 56.0, 54.0, 50.0, 52.0, 41.0, 34.0, 29.0, 47.0, 25.0, 21.0, 14.0, 12.0, 15.0, 6.0, 9.0, 6.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.599609375, -0.5784912109375, -0.557373046875, -0.5362548828125, -0.51513671875, -0.4940185546875, -0.472900390625, -0.4517822265625, -0.4306640625, -0.4095458984375, -0.388427734375, -0.3673095703125, -0.34619140625, -0.3250732421875, -0.303955078125, -0.2828369140625, -0.26171875, -0.2406005859375, -0.219482421875, -0.1983642578125, -0.17724609375, -0.1561279296875, -0.135009765625, -0.1138916015625, -0.0927734375, -0.0716552734375, -0.050537109375, -0.0294189453125, -0.00830078125, 0.0128173828125, 0.033935546875, 0.0550537109375, 0.076171875, 0.0972900390625, 0.118408203125, 0.1395263671875, 0.16064453125, 0.1817626953125, 0.202880859375, 0.2239990234375, 0.2451171875, 0.2662353515625, 0.287353515625, 0.3084716796875, 0.32958984375, 0.3507080078125, 0.371826171875, 0.3929443359375, 0.4140625, 0.4351806640625, 0.456298828125, 0.4774169921875, 0.49853515625, 0.5196533203125, 0.540771484375, 0.5618896484375, 0.5830078125, 0.6041259765625, 0.625244140625, 0.6463623046875, 0.66748046875, 0.6885986328125, 0.709716796875, 0.7308349609375, 0.751953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 6.0, 8.0, 16.0, 20.0, 29.0, 69.0, 121.0, 136.0, 167.0, 144.0, 120.0, 60.0, 52.0, 19.0, 12.0, 11.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.49358558654785, -19.80167579650879, -19.10976791381836, -18.417858123779297, -17.725950241088867, -17.034040451049805, -16.342132568359375, -15.650222778320312, -14.95831298828125, -14.266404151916504, -13.574495315551758, -12.882585525512695, -12.19067668914795, -11.498767852783203, -10.806859016418457, -10.114950180053711, -9.423041343688965, -8.731132507324219, -8.039223670959473, -7.347314357757568, -6.655405044555664, -5.963496208190918, -5.271587371826172, -4.579678058624268, -3.8877692222595215, -3.1958601474761963, -2.503951072692871, -1.812042236328125, -1.1201331615447998, -0.4282240867614746, 0.2636847496032715, 0.9555940628051758, 1.6475028991699219, 2.339411973953247, 3.0313210487365723, 3.7232298851013184, 4.415139198303223, 5.107048034667969, 5.798956871032715, 6.490866184234619, 7.182775020599365, 7.874683856964111, 8.566593170166016, 9.258502006530762, 9.950410842895508, 10.64232063293457, 11.334228515625, 12.026138305664062, 12.718047142028809, 13.409955978393555, 14.1018648147583, 14.793773651123047, 15.48568344116211, 16.177593231201172, 16.8695011138916, 17.561410903930664, 18.253318786621094, 18.945228576660156, 19.637136459350586, 20.32904624938965, 21.020954132080078, 21.71286392211914, 22.404773712158203, 23.096681594848633, 23.788591384887695]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 3.0, 4.0, 16.0, 8.0, 16.0, 23.0, 25.0, 21.0, 18.0, 26.0, 38.0, 31.0, 35.0, 34.0, 35.0, 31.0, 47.0, 43.0, 41.0, 52.0, 42.0, 46.0, 39.0, 34.0, 26.0, 39.0, 31.0, 28.0, 31.0, 25.0, 23.0, 16.0, 9.0, 9.0, 7.0, 9.0, 8.0, 3.0, 4.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.553396224975586, -15.088220596313477, -14.623044967651367, -14.157869338989258, -13.692693710327148, -13.227518081665039, -12.762343406677246, -12.297167778015137, -11.831992149353027, -11.366816520690918, -10.901640892028809, -10.4364652633667, -9.971290588378906, -9.506114959716797, -9.040939331054688, -8.575763702392578, -8.110588073730469, -7.645412445068359, -7.18023681640625, -6.715061664581299, -6.2498860359191895, -5.78471040725708, -5.319535255432129, -4.8543596267700195, -4.38918399810791, -3.924008369445801, -3.4588329792022705, -2.9936575889587402, -2.528481960296631, -2.0633063316345215, -1.5981309413909912, -1.132955551147461, -0.667780876159668, -0.20260536670684814, 0.2625701427459717, 0.7277456521987915, 1.1929211616516113, 1.6580967903137207, 2.123272180557251, 2.5884475708007812, 3.0536231994628906, 3.518798828125, 3.9839742183685303, 4.4491496086120605, 4.91432523727417, 5.379500865936279, 5.8446760177612305, 6.30985164642334, 6.775027275085449, 7.240202903747559, 7.705378532409668, 8.170554161071777, 8.63572883605957, 9.10090446472168, 9.566080093383789, 10.031255722045898, 10.496431350708008, 10.961606979370117, 11.426782608032227, 11.891958236694336, 12.357133865356445, 12.822309494018555, 13.287484169006348, 13.752659797668457, 14.217835426330566]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 8.0, 9.0, 20.0, 34.0, 49.0, 64.0, 137.0, 205.0, 331.0, 639.0, 1040.0, 2258.0, 4523.0, 9081.0, 20066.0, 51971.0, 134535.0, 318247.0, 618199.0, 892942.0, 915797.0, 652851.0, 339516.0, 140571.0, 53363.0, 20456.0, 8722.0, 4109.0, 1982.0, 1059.0, 612.0, 308.0, 210.0, 122.0, 105.0, 41.0, 34.0, 23.0, 16.0, 9.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8857421875, -1.830322265625, -1.77490234375, -1.719482421875, -1.6640625, -1.608642578125, -1.55322265625, -1.497802734375, -1.4423828125, -1.386962890625, -1.33154296875, -1.276123046875, -1.220703125, -1.165283203125, -1.10986328125, -1.054443359375, -0.9990234375, -0.943603515625, -0.88818359375, -0.832763671875, -0.77734375, -0.721923828125, -0.66650390625, -0.611083984375, -0.5556640625, -0.500244140625, -0.44482421875, -0.389404296875, -0.333984375, -0.278564453125, -0.22314453125, -0.167724609375, -0.1123046875, -0.056884765625, -0.00146484375, 0.053955078125, 0.109375, 0.164794921875, 0.22021484375, 0.275634765625, 0.3310546875, 0.386474609375, 0.44189453125, 0.497314453125, 0.552734375, 0.608154296875, 0.66357421875, 0.718994140625, 0.7744140625, 0.829833984375, 0.88525390625, 0.940673828125, 0.99609375, 1.051513671875, 1.10693359375, 1.162353515625, 1.2177734375, 1.273193359375, 1.32861328125, 1.384033203125, 1.439453125, 1.494873046875, 1.55029296875, 1.605712890625, 1.6611328125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 17.0, 14.0, 14.0, 22.0, 24.0, 30.0, 39.0, 37.0, 34.0, 50.0, 46.0, 62.0, 49.0, 59.0, 50.0, 55.0, 52.0, 52.0, 43.0, 41.0, 38.0, 32.0, 31.0, 16.0, 17.0, 16.0, 9.0, 9.0, 7.0, 11.0, 4.0, 8.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.956756591796875, -1.87835693359375, -1.799957275390625, -1.7215576171875, -1.643157958984375, -1.56475830078125, -1.486358642578125, -1.407958984375, -1.329559326171875, -1.25115966796875, -1.172760009765625, -1.0943603515625, -1.015960693359375, -0.93756103515625, -0.859161376953125, -0.78076171875, -0.702362060546875, -0.62396240234375, -0.545562744140625, -0.4671630859375, -0.388763427734375, -0.31036376953125, -0.231964111328125, -0.153564453125, -0.075164794921875, 0.00323486328125, 0.081634521484375, 0.1600341796875, 0.238433837890625, 0.31683349609375, 0.395233154296875, 0.4736328125, 0.552032470703125, 0.63043212890625, 0.708831787109375, 0.7872314453125, 0.865631103515625, 0.94403076171875, 1.022430419921875, 1.100830078125, 1.179229736328125, 1.25762939453125, 1.336029052734375, 1.4144287109375, 1.492828369140625, 1.57122802734375, 1.649627685546875, 1.72802734375, 1.806427001953125, 1.88482666015625, 1.963226318359375, 2.0416259765625, 2.120025634765625, 2.19842529296875, 2.276824951171875, 2.355224609375, 2.433624267578125, 2.51202392578125, 2.590423583984375, 2.6688232421875, 2.747222900390625, 2.82562255859375, 2.904022216796875, 2.982421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 10.0, 13.0, 14.0, 20.0, 25.0, 57.0, 97.0, 136.0, 260.0, 436.0, 858.0, 1810.0, 5905.0, 34006.0, 453494.0, 3226659.0, 429389.0, 32116.0, 5644.0, 1726.0, 739.0, 364.0, 184.0, 136.0, 74.0, 33.0, 24.0, 23.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.18511962890625, -4.0069580078125, -3.82879638671875, -3.650634765625, -3.47247314453125, -3.2943115234375, -3.11614990234375, -2.93798828125, -2.75982666015625, -2.5816650390625, -2.40350341796875, -2.225341796875, -2.04718017578125, -1.8690185546875, -1.69085693359375, -1.5126953125, -1.33453369140625, -1.1563720703125, -0.97821044921875, -0.800048828125, -0.62188720703125, -0.4437255859375, -0.26556396484375, -0.08740234375, 0.09075927734375, 0.2689208984375, 0.44708251953125, 0.625244140625, 0.80340576171875, 0.9815673828125, 1.15972900390625, 1.337890625, 1.51605224609375, 1.6942138671875, 1.87237548828125, 2.050537109375, 2.22869873046875, 2.4068603515625, 2.58502197265625, 2.76318359375, 2.94134521484375, 3.1195068359375, 3.29766845703125, 3.475830078125, 3.65399169921875, 3.8321533203125, 4.01031494140625, 4.1884765625, 4.36663818359375, 4.5447998046875, 4.72296142578125, 4.901123046875, 5.07928466796875, 5.2574462890625, 5.43560791015625, 5.61376953125, 5.79193115234375, 5.9700927734375, 6.14825439453125, 6.326416015625, 6.50457763671875, 6.6827392578125, 6.86090087890625, 7.0390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 8.0, 13.0, 14.0, 20.0, 30.0, 49.0, 67.0, 109.0, 142.0, 200.0, 255.0, 317.0, 410.0, 450.0, 430.0, 372.0, 298.0, 246.0, 174.0, 136.0, 91.0, 85.0, 47.0, 28.0, 33.0, 10.0, 14.0, 14.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.585693359375, -4.44091796875, -4.296142578125, -4.1513671875, -4.006591796875, -3.86181640625, -3.717041015625, -3.572265625, -3.427490234375, -3.28271484375, -3.137939453125, -2.9931640625, -2.848388671875, -2.70361328125, -2.558837890625, -2.4140625, -2.269287109375, -2.12451171875, -1.979736328125, -1.8349609375, -1.690185546875, -1.54541015625, -1.400634765625, -1.255859375, -1.111083984375, -0.96630859375, -0.821533203125, -0.6767578125, -0.531982421875, -0.38720703125, -0.242431640625, -0.09765625, 0.047119140625, 0.19189453125, 0.336669921875, 0.4814453125, 0.626220703125, 0.77099609375, 0.915771484375, 1.060546875, 1.205322265625, 1.35009765625, 1.494873046875, 1.6396484375, 1.784423828125, 1.92919921875, 2.073974609375, 2.21875, 2.363525390625, 2.50830078125, 2.653076171875, 2.7978515625, 2.942626953125, 3.08740234375, 3.232177734375, 3.376953125, 3.521728515625, 3.66650390625, 3.811279296875, 3.9560546875, 4.100830078125, 4.24560546875, 4.390380859375, 4.53515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 16.0, 21.0, 27.0, 42.0, 72.0, 107.0, 139.0, 132.0, 126.0, 99.0, 63.0, 43.0, 40.0, 28.0, 16.0, 4.0, 6.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.61034393310547, -47.10532760620117, -45.600311279296875, -44.095298767089844, -42.59028244018555, -41.08526611328125, -39.58024978637695, -38.075233459472656, -36.570220947265625, -35.06520462036133, -33.56018829345703, -32.05517578125, -30.550159454345703, -29.045143127441406, -27.54012680053711, -26.035110473632812, -24.530094146728516, -23.02507781982422, -21.520063400268555, -20.015047073364258, -18.510032653808594, -17.005016326904297, -15.5, -13.99498462677002, -12.489969253540039, -10.984953880310059, -9.479938507080078, -7.974922180175781, -6.469906806945801, -4.96489143371582, -3.4598751068115234, -1.954859733581543, -0.4498481750488281, 1.0551674365997314, 2.560183048248291, 4.06519889831543, 5.57021427154541, 7.075229644775391, 8.580245971679688, 10.085261344909668, 11.590276718139648, 13.095292091369629, 14.60030746459961, 16.105323791503906, 17.610340118408203, 19.115354537963867, 20.620370864868164, 22.125385284423828, 23.630401611328125, 25.135417938232422, 26.640432357788086, 28.145448684692383, 29.650463104248047, 31.155479431152344, 32.66049575805664, 34.16551208496094, 35.67052459716797, 37.175540924072266, 38.68055725097656, 40.185569763183594, 41.69058609008789, 43.19560241699219, 44.700618743896484, 46.20563507080078, 47.71065139770508]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 5.0, 4.0, 6.0, 7.0, 11.0, 13.0, 12.0, 15.0, 23.0, 23.0, 22.0, 28.0, 32.0, 42.0, 31.0, 32.0, 41.0, 43.0, 34.0, 36.0, 31.0, 44.0, 48.0, 35.0, 35.0, 47.0, 30.0, 35.0, 33.0, 28.0, 21.0, 24.0, 19.0, 18.0, 17.0, 14.0, 15.0, 6.0, 7.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-16.908281326293945, -16.39325523376465, -15.878228187561035, -15.363201141357422, -14.848175048828125, -14.333148956298828, -13.818121910095215, -13.303094863891602, -12.788068771362305, -12.273042678833008, -11.758015632629395, -11.242988586425781, -10.727962493896484, -10.212936401367188, -9.697909355163574, -9.182882308959961, -8.667856216430664, -8.152830123901367, -7.637803077697754, -7.122776508331299, -6.607749938964844, -6.092723369598389, -5.577696800231934, -5.0626702308654785, -4.547643661499023, -4.032617092132568, -3.5175905227661133, -3.002563953399658, -2.487537384033203, -1.972510814666748, -1.457484245300293, -0.9424576759338379, -0.42742919921875, 0.08759737014770508, 0.6026239395141602, 1.1176505088806152, 1.6326770782470703, 2.1477036476135254, 2.6627302169799805, 3.1777567863464355, 3.6927833557128906, 4.207809925079346, 4.722836494445801, 5.237863063812256, 5.752889633178711, 6.267916202545166, 6.782942771911621, 7.297969341278076, 7.812995910644531, 8.328022003173828, 8.843049049377441, 9.358076095581055, 9.873102188110352, 10.388128280639648, 10.903155326843262, 11.418182373046875, 11.933208465576172, 12.448234558105469, 12.963261604309082, 13.478288650512695, 13.993314743041992, 14.508340835571289, 15.023367881774902, 15.538394927978516, 16.053421020507812]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 10.0, 12.0, 12.0, 21.0, 20.0, 51.0, 64.0, 100.0, 184.0, 247.0, 551.0, 1071.0, 2371.0, 5723.0, 16302.0, 60108.0, 273446.0, 484918.0, 150535.0, 34789.0, 10506.0, 4015.0, 1705.0, 761.0, 443.0, 216.0, 119.0, 82.0, 50.0, 30.0, 24.0, 17.0, 16.0, 11.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.724609375, -2.6402587890625, -2.555908203125, -2.4715576171875, -2.38720703125, -2.3028564453125, -2.218505859375, -2.1341552734375, -2.0498046875, -1.9654541015625, -1.881103515625, -1.7967529296875, -1.71240234375, -1.6280517578125, -1.543701171875, -1.4593505859375, -1.375, -1.2906494140625, -1.206298828125, -1.1219482421875, -1.03759765625, -0.9532470703125, -0.868896484375, -0.7845458984375, -0.7001953125, -0.6158447265625, -0.531494140625, -0.4471435546875, -0.36279296875, -0.2784423828125, -0.194091796875, -0.1097412109375, -0.025390625, 0.0589599609375, 0.143310546875, 0.2276611328125, 0.31201171875, 0.3963623046875, 0.480712890625, 0.5650634765625, 0.6494140625, 0.7337646484375, 0.818115234375, 0.9024658203125, 0.98681640625, 1.0711669921875, 1.155517578125, 1.2398681640625, 1.32421875, 1.4085693359375, 1.492919921875, 1.5772705078125, 1.66162109375, 1.7459716796875, 1.830322265625, 1.9146728515625, 1.9990234375, 2.0833740234375, 2.167724609375, 2.2520751953125, 2.33642578125, 2.4207763671875, 2.505126953125, 2.5894775390625, 2.673828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 7.0, 8.0, 12.0, 21.0, 25.0, 25.0, 20.0, 40.0, 33.0, 27.0, 42.0, 38.0, 46.0, 60.0, 62.0, 54.0, 47.0, 43.0, 58.0, 46.0, 38.0, 39.0, 31.0, 32.0, 26.0, 19.0, 20.0, 12.0, 18.0, 13.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.125, -3.026214599609375, -2.92742919921875, -2.828643798828125, -2.7298583984375, -2.631072998046875, -2.53228759765625, -2.433502197265625, -2.334716796875, -2.235931396484375, -2.13714599609375, -2.038360595703125, -1.9395751953125, -1.840789794921875, -1.74200439453125, -1.643218994140625, -1.54443359375, -1.445648193359375, -1.34686279296875, -1.248077392578125, -1.1492919921875, -1.050506591796875, -0.95172119140625, -0.852935791015625, -0.754150390625, -0.655364990234375, -0.55657958984375, -0.457794189453125, -0.3590087890625, -0.260223388671875, -0.16143798828125, -0.062652587890625, 0.0361328125, 0.134918212890625, 0.23370361328125, 0.332489013671875, 0.4312744140625, 0.530059814453125, 0.62884521484375, 0.727630615234375, 0.826416015625, 0.925201416015625, 1.02398681640625, 1.122772216796875, 1.2215576171875, 1.320343017578125, 1.41912841796875, 1.517913818359375, 1.61669921875, 1.715484619140625, 1.81427001953125, 1.913055419921875, 2.0118408203125, 2.110626220703125, 2.20941162109375, 2.308197021484375, 2.406982421875, 2.505767822265625, 2.60455322265625, 2.703338623046875, 2.8021240234375, 2.900909423828125, 2.99969482421875, 3.098480224609375, 3.197265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 3.0, 6.0, 12.0, 17.0, 24.0, 15.0, 40.0, 53.0, 79.0, 153.0, 182.0, 308.0, 521.0, 989.0, 1872.0, 3988.0, 9173.0, 24768.0, 84715.0, 434852.0, 364803.0, 80686.0, 24245.0, 8972.0, 3868.0, 1810.0, 987.0, 538.0, 283.0, 194.0, 109.0, 90.0, 55.0, 43.0, 22.0, 24.0, 14.0, 14.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-2.734375, -2.65838623046875, -2.5823974609375, -2.50640869140625, -2.430419921875, -2.35443115234375, -2.2784423828125, -2.20245361328125, -2.12646484375, -2.05047607421875, -1.9744873046875, -1.89849853515625, -1.822509765625, -1.74652099609375, -1.6705322265625, -1.59454345703125, -1.5185546875, -1.44256591796875, -1.3665771484375, -1.29058837890625, -1.214599609375, -1.13861083984375, -1.0626220703125, -0.98663330078125, -0.91064453125, -0.83465576171875, -0.7586669921875, -0.68267822265625, -0.606689453125, -0.53070068359375, -0.4547119140625, -0.37872314453125, -0.302734375, -0.22674560546875, -0.1507568359375, -0.07476806640625, 0.001220703125, 0.07720947265625, 0.1531982421875, 0.22918701171875, 0.30517578125, 0.38116455078125, 0.4571533203125, 0.53314208984375, 0.609130859375, 0.68511962890625, 0.7611083984375, 0.83709716796875, 0.9130859375, 0.98907470703125, 1.0650634765625, 1.14105224609375, 1.217041015625, 1.29302978515625, 1.3690185546875, 1.44500732421875, 1.52099609375, 1.59698486328125, 1.6729736328125, 1.74896240234375, 1.824951171875, 1.90093994140625, 1.9769287109375, 2.05291748046875, 2.12890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 10.0, 9.0, 18.0, 18.0, 21.0, 29.0, 40.0, 37.0, 36.0, 44.0, 42.0, 59.0, 59.0, 68.0, 63.0, 44.0, 49.0, 43.0, 47.0, 47.0, 37.0, 31.0, 30.0, 18.0, 23.0, 14.0, 8.0, 9.0, 8.0, 2.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.5474853515625, -7.305908203125, -7.0643310546875, -6.82275390625, -6.5811767578125, -6.339599609375, -6.0980224609375, -5.8564453125, -5.6148681640625, -5.373291015625, -5.1317138671875, -4.89013671875, -4.6485595703125, -4.406982421875, -4.1654052734375, -3.923828125, -3.6822509765625, -3.440673828125, -3.1990966796875, -2.95751953125, -2.7159423828125, -2.474365234375, -2.2327880859375, -1.9912109375, -1.7496337890625, -1.508056640625, -1.2664794921875, -1.02490234375, -0.7833251953125, -0.541748046875, -0.3001708984375, -0.05859375, 0.1829833984375, 0.424560546875, 0.6661376953125, 0.90771484375, 1.1492919921875, 1.390869140625, 1.6324462890625, 1.8740234375, 2.1156005859375, 2.357177734375, 2.5987548828125, 2.84033203125, 3.0819091796875, 3.323486328125, 3.5650634765625, 3.806640625, 4.0482177734375, 4.289794921875, 4.5313720703125, 4.77294921875, 5.0145263671875, 5.256103515625, 5.4976806640625, 5.7392578125, 5.9808349609375, 6.222412109375, 6.4639892578125, 6.70556640625, 6.9471435546875, 7.188720703125, 7.4302978515625, 7.671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 8.0, 19.0, 18.0, 29.0, 57.0, 65.0, 124.0, 217.0, 421.0, 958.0, 2697.0, 10459.0, 84935.0, 831366.0, 100837.0, 11540.0, 2857.0, 933.0, 425.0, 228.0, 137.0, 75.0, 44.0, 35.0, 21.0, 14.0, 12.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.26708984375, -1.2255859375, -1.18408203125, -1.142578125, -1.10107421875, -1.0595703125, -1.01806640625, -0.9765625, -0.93505859375, -0.8935546875, -0.85205078125, -0.810546875, -0.76904296875, -0.7275390625, -0.68603515625, -0.64453125, -0.60302734375, -0.5615234375, -0.52001953125, -0.478515625, -0.43701171875, -0.3955078125, -0.35400390625, -0.3125, -0.27099609375, -0.2294921875, -0.18798828125, -0.146484375, -0.10498046875, -0.0634765625, -0.02197265625, 0.01953125, 0.06103515625, 0.1025390625, 0.14404296875, 0.185546875, 0.22705078125, 0.2685546875, 0.31005859375, 0.3515625, 0.39306640625, 0.4345703125, 0.47607421875, 0.517578125, 0.55908203125, 0.6005859375, 0.64208984375, 0.68359375, 0.72509765625, 0.7666015625, 0.80810546875, 0.849609375, 0.89111328125, 0.9326171875, 0.97412109375, 1.015625, 1.05712890625, 1.0986328125, 1.14013671875, 1.181640625, 1.22314453125, 1.2646484375, 1.30615234375, 1.34765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 9.0, 8.0, 14.0, 20.0, 28.0, 48.0, 54.0, 71.0, 104.0, 86.0, 120.0, 119.0, 79.0, 53.0, 36.0, 36.0, 20.0, 18.0, 17.0, 11.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023090839385986328, -0.00022430531680583954, -0.0002177022397518158, -0.00021109916269779205, -0.0002044960856437683, -0.00019789300858974457, -0.00019128993153572083, -0.00018468685448169708, -0.00017808377742767334, -0.0001714807003736496, -0.00016487762331962585, -0.0001582745462656021, -0.00015167146921157837, -0.00014506839215755463, -0.00013846531510353088, -0.00013186223804950714, -0.0001252591609954834, -0.00011865608394145966, -0.00011205300688743591, -0.00010544992983341217, -9.884685277938843e-05, -9.224377572536469e-05, -8.564069867134094e-05, -7.90376216173172e-05, -7.243454456329346e-05, -6.583146750926971e-05, -5.922839045524597e-05, -5.262531340122223e-05, -4.6022236347198486e-05, -3.9419159293174744e-05, -3.2816082239151e-05, -2.6213005185127258e-05, -1.9609928131103516e-05, -1.3006851077079773e-05, -6.40377402305603e-06, 1.993030309677124e-07, 6.802380084991455e-06, 1.3405457139015198e-05, 2.000853419303894e-05, 2.6611611247062683e-05, 3.3214688301086426e-05, 3.981776535511017e-05, 4.642084240913391e-05, 5.3023919463157654e-05, 5.9626996517181396e-05, 6.623007357120514e-05, 7.283315062522888e-05, 7.943622767925262e-05, 8.603930473327637e-05, 9.264238178730011e-05, 9.924545884132385e-05, 0.0001058485358953476, 0.00011245161294937134, 0.00011905469000339508, 0.00012565776705741882, 0.00013226084411144257, 0.0001388639211654663, 0.00014546699821949005, 0.0001520700752735138, 0.00015867315232753754, 0.00016527622938156128, 0.00017187930643558502, 0.00017848238348960876, 0.0001850854605436325, 0.00019168853759765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 15.0, 14.0, 15.0, 33.0, 42.0, 58.0, 108.0, 162.0, 273.0, 441.0, 1045.0, 2955.0, 12955.0, 105655.0, 788097.0, 116789.0, 14147.0, 3312.0, 1135.0, 517.0, 268.0, 160.0, 118.0, 73.0, 39.0, 25.0, 27.0, 17.0, 15.0, 7.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.228515625, -1.1854400634765625, -1.142364501953125, -1.0992889404296875, -1.05621337890625, -1.0131378173828125, -0.970062255859375, -0.9269866943359375, -0.8839111328125, -0.8408355712890625, -0.797760009765625, -0.7546844482421875, -0.71160888671875, -0.6685333251953125, -0.625457763671875, -0.5823822021484375, -0.539306640625, -0.4962310791015625, -0.453155517578125, -0.4100799560546875, -0.36700439453125, -0.3239288330078125, -0.280853271484375, -0.2377777099609375, -0.1947021484375, -0.1516265869140625, -0.108551025390625, -0.0654754638671875, -0.02239990234375, 0.0206756591796875, 0.063751220703125, 0.1068267822265625, 0.14990234375, 0.1929779052734375, 0.236053466796875, 0.2791290283203125, 0.32220458984375, 0.3652801513671875, 0.408355712890625, 0.4514312744140625, 0.4945068359375, 0.5375823974609375, 0.580657958984375, 0.6237335205078125, 0.66680908203125, 0.7098846435546875, 0.752960205078125, 0.7960357666015625, 0.839111328125, 0.8821868896484375, 0.925262451171875, 0.9683380126953125, 1.01141357421875, 1.0544891357421875, 1.097564697265625, 1.1406402587890625, 1.1837158203125, 1.2267913818359375, 1.269866943359375, 1.3129425048828125, 1.35601806640625, 1.3990936279296875, 1.442169189453125, 1.4852447509765625, 1.5283203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 9.0, 9.0, 7.0, 9.0, 10.0, 14.0, 9.0, 14.0, 21.0, 28.0, 24.0, 43.0, 57.0, 66.0, 69.0, 90.0, 74.0, 98.0, 69.0, 51.0, 46.0, 30.0, 23.0, 25.0, 13.0, 8.0, 9.0, 11.0, 11.0, 3.0, 7.0, 6.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.99267578125, -0.9608383178710938, -0.9290008544921875, -0.8971633911132812, -0.865325927734375, -0.8334884643554688, -0.8016510009765625, -0.7698135375976562, -0.73797607421875, -0.7061386108398438, -0.6743011474609375, -0.6424636840820312, -0.610626220703125, -0.5787887573242188, -0.5469512939453125, -0.5151138305664062, -0.4832763671875, -0.45143890380859375, -0.4196014404296875, -0.38776397705078125, -0.355926513671875, -0.32408905029296875, -0.2922515869140625, -0.26041412353515625, -0.22857666015625, -0.19673919677734375, -0.1649017333984375, -0.13306427001953125, -0.101226806640625, -0.06938934326171875, -0.0375518798828125, -0.00571441650390625, 0.026123046875, 0.05796051025390625, 0.0897979736328125, 0.12163543701171875, 0.153472900390625, 0.18531036376953125, 0.2171478271484375, 0.24898529052734375, 0.28082275390625, 0.31266021728515625, 0.3444976806640625, 0.37633514404296875, 0.408172607421875, 0.44001007080078125, 0.4718475341796875, 0.5036849975585938, 0.5355224609375, 0.5673599243164062, 0.5991973876953125, 0.6310348510742188, 0.662872314453125, 0.6947097778320312, 0.7265472412109375, 0.7583847045898438, 0.79022216796875, 0.8220596313476562, 0.8538970947265625, 0.8857345581054688, 0.917572021484375, 0.9494094848632812, 0.9812469482421875, 1.0130844116210938, 1.044921875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 16.0, 19.0, 23.0, 56.0, 101.0, 147.0, 209.0, 161.0, 113.0, 62.0, 37.0, 14.0, 16.0, 7.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.8845157623291, -20.003063201904297, -19.121610641479492, -18.240158081054688, -17.358705520629883, -16.477252960205078, -15.595800399780273, -14.714347839355469, -13.832895278930664, -12.95144271850586, -12.069990158081055, -11.18853759765625, -10.307085037231445, -9.42563247680664, -8.544179916381836, -7.662727355957031, -6.781274795532227, -5.899822235107422, -5.018369674682617, -4.1369171142578125, -3.255464553833008, -2.374011993408203, -1.4925594329833984, -0.6111068725585938, 0.27034568786621094, 1.1517982482910156, 2.0332508087158203, 2.914703369140625, 3.7961559295654297, 4.677608489990234, 5.559061050415039, 6.440513610839844, 7.321968078613281, 8.203420639038086, 9.08487319946289, 9.966325759887695, 10.8477783203125, 11.729230880737305, 12.61068344116211, 13.492136001586914, 14.373588562011719, 15.255041122436523, 16.136493682861328, 17.017946243286133, 17.899398803710938, 18.780851364135742, 19.662303924560547, 20.54375648498535, 21.425209045410156, 22.30666160583496, 23.188114166259766, 24.06956672668457, 24.951019287109375, 25.83247184753418, 26.713924407958984, 27.59537696838379, 28.476829528808594, 29.3582820892334, 30.239734649658203, 31.121187210083008, 32.00263977050781, 32.88409423828125, 33.76554489135742, 34.646995544433594, 35.52845001220703]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 10.0, 13.0, 18.0, 20.0, 26.0, 29.0, 26.0, 33.0, 35.0, 54.0, 68.0, 82.0, 90.0, 88.0, 52.0, 51.0, 41.0, 46.0, 44.0, 24.0, 33.0, 19.0, 15.0, 13.0, 14.0, 13.0, 9.0, 7.0, 2.0, 1.0, 8.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.42766571044922, -23.746395111083984, -23.06512451171875, -22.383852005004883, -21.70258140563965, -21.021310806274414, -20.34004020690918, -19.658767700195312, -18.977497100830078, -18.296226501464844, -17.61495590209961, -16.933683395385742, -16.252412796020508, -15.571142196655273, -14.889871597290039, -14.208600044250488, -13.527329444885254, -12.84605884552002, -12.164787292480469, -11.483516693115234, -10.802245140075684, -10.12097454071045, -9.439702987670898, -8.758432388305664, -8.07716178894043, -7.395890712738037, -6.7146196365356445, -6.03334903717041, -5.352077484130859, -4.670806884765625, -3.9895358085632324, -3.30826473236084, -2.626993179321289, -1.9457221031188965, -1.2644511461257935, -0.5831801891326904, 0.09809088706970215, 0.7793619632720947, 1.4606328010559082, 2.141903877258301, 2.8231749534606934, 3.504446029663086, 4.1857171058654785, 4.866988182067871, 5.5482587814331055, 6.229530334472656, 6.910800933837891, 7.592072010040283, 8.273343086242676, 8.95461368560791, 9.635885238647461, 10.317155838012695, 10.998427391052246, 11.67969799041748, 12.360969543457031, 13.042240142822266, 13.7235107421875, 14.404781341552734, 15.086052894592285, 15.76732349395752, 16.44859504699707, 17.129865646362305, 17.81113624572754, 18.492408752441406, 19.17367935180664]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 4.0, 6.0, 9.0, 7.0, 12.0, 15.0, 15.0, 15.0, 14.0, 18.0, 24.0, 16.0, 34.0, 41.0, 68.0, 179.0, 199.0, 78.0, 45.0, 31.0, 31.0, 25.0, 22.0, 24.0, 15.0, 12.0, 12.0, 6.0, 3.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.11322021484375, -2.0174560546875, -1.92169189453125, -1.825927734375, -1.73016357421875, -1.6343994140625, -1.53863525390625, -1.44287109375, -1.34710693359375, -1.2513427734375, -1.15557861328125, -1.059814453125, -0.96405029296875, -0.8682861328125, -0.77252197265625, -0.6767578125, -0.58099365234375, -0.4852294921875, -0.38946533203125, -0.293701171875, -0.19793701171875, -0.1021728515625, -0.00640869140625, 0.08935546875, 0.18511962890625, 0.2808837890625, 0.37664794921875, 0.472412109375, 0.56817626953125, 0.6639404296875, 0.75970458984375, 0.85546875, 0.95123291015625, 1.0469970703125, 1.14276123046875, 1.238525390625, 1.33428955078125, 1.4300537109375, 1.52581787109375, 1.62158203125, 1.71734619140625, 1.8131103515625, 1.90887451171875, 2.004638671875, 2.10040283203125, 2.1961669921875, 2.29193115234375, 2.3876953125, 2.48345947265625, 2.5792236328125, 2.67498779296875, 2.770751953125, 2.86651611328125, 2.9622802734375, 3.05804443359375, 3.15380859375, 3.24957275390625, 3.3453369140625, 3.44110107421875, 3.536865234375, 3.63262939453125, 3.7283935546875, 3.82415771484375, 3.919921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 3.0, 8.0, 7.0, 4.0, 9.0, 6.0, 16.0, 21.0, 30.0, 62.0, 62.0, 121.0, 188.0, 290.0, 556.0, 1105.0, 2347.0, 5733.0, 18648.0, 7712430.0, 621108.0, 15993.0, 5171.0, 2158.0, 1051.0, 562.0, 297.0, 197.0, 128.0, 71.0, 50.0, 44.0, 30.0, 23.0, 13.0, 12.0, 7.0, 11.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-9.680540084838867, -9.425344467163086, -9.170148849487305, -8.91495418548584, -8.659758567810059, -8.404562950134277, -8.149367332458496, -7.894171714782715, -7.638976573944092, -7.3837809562683105, -7.1285858154296875, -6.873390197753906, -6.618194580078125, -6.362999439239502, -6.107803821563721, -5.852608680725098, -5.597413063049316, -5.342217445373535, -5.087022304534912, -4.831826686859131, -4.576631546020508, -4.321435928344727, -4.066240310668945, -3.811044931411743, -3.555849552154541, -3.300654172897339, -3.0454587936401367, -2.7902631759643555, -2.5350677967071533, -2.279872417449951, -2.02467679977417, -1.7694814205169678, -1.5142860412597656, -1.2590906620025635, -1.0038951635360718, -0.7486997246742249, -0.49350428581237793, -0.23830890655517578, 0.016886591911315918, 0.2720820903778076, 0.5272774696350098, 0.7824729084968567, 1.0376683473587036, 1.2928638458251953, 1.5480592250823975, 1.8032546043395996, 2.058450222015381, 2.313645601272583, 2.568840980529785, 2.8240363597869873, 3.0792317390441895, 3.3344273567199707, 3.589622735977173, 3.844818115234375, 4.100013732910156, 4.3552093505859375, 4.6104044914245605, 4.865600109100342, 5.120795249938965, 5.375990867614746, 5.631186485290527, 5.88638162612915, 6.141577243804932, 6.396772384643555, 6.651968002319336]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 3.0, 7.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 3.0, 0.0, 6.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.560235977172852, -13.227935791015625, -12.895635604858398, -12.563334465026855, -12.231034278869629, -11.898734092712402, -11.56643295288086, -11.234132766723633, -10.901832580566406, -10.56953239440918, -10.237232208251953, -9.90493106842041, -9.572630882263184, -9.240330696105957, -8.908029556274414, -8.575729370117188, -8.243429183959961, -7.911128997802734, -7.57882833480835, -7.246527671813965, -6.914227485656738, -6.581927299499512, -6.249626636505127, -5.917325973510742, -5.585025787353516, -5.252725601196289, -4.920424938201904, -4.5881242752075195, -4.255824089050293, -3.9235236644744873, -3.5912232398986816, -3.258922815322876, -2.9266233444213867, -2.594322919845581, -2.2620224952697754, -1.9297220706939697, -1.597421646118164, -1.2651212215423584, -0.9328207969665527, -0.6005203723907471, -0.2682199478149414, 0.06408047676086426, 0.3963809013366699, 0.7286813259124756, 1.0609817504882812, 1.393282175064087, 1.7255825996398926, 2.0578830242156982, 2.390183448791504, 2.7224838733673096, 3.0547842979431152, 3.387084722518921, 3.7193851470947266, 4.051685333251953, 4.383985996246338, 4.716286659240723, 5.048586845397949, 5.380887031555176, 5.7131876945495605, 6.045488357543945, 6.377788543701172, 6.710088729858398, 7.042389392852783, 7.374690055847168, 7.7069902420043945]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 14.0, 9.0, 17.0, 22.0, 21.0, 36.0, 49.0, 38.0, 40.0, 50.0, 54.0, 62.0, 67.0, 50.0, 68.0, 43.0, 54.0, 49.0, 41.0, 42.0, 31.0, 28.0, 20.0, 20.0, 13.0, 11.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6775970458984375, -1.615936279296875, -1.5542755126953125, -1.49261474609375, -1.4309539794921875, -1.369293212890625, -1.3076324462890625, -1.2459716796875, -1.1843109130859375, -1.122650146484375, -1.0609893798828125, -0.99932861328125, -0.9376678466796875, -0.876007080078125, -0.8143463134765625, -0.752685546875, -0.6910247802734375, -0.629364013671875, -0.5677032470703125, -0.50604248046875, -0.4443817138671875, -0.382720947265625, -0.3210601806640625, -0.2593994140625, -0.1977386474609375, -0.136077880859375, -0.0744171142578125, -0.01275634765625, 0.0489044189453125, 0.110565185546875, 0.1722259521484375, 0.23388671875, 0.2955474853515625, 0.357208251953125, 0.4188690185546875, 0.48052978515625, 0.5421905517578125, 0.603851318359375, 0.6655120849609375, 0.7271728515625, 0.7888336181640625, 0.850494384765625, 0.9121551513671875, 0.97381591796875, 1.0354766845703125, 1.097137451171875, 1.1587982177734375, 1.220458984375, 1.2821197509765625, 1.343780517578125, 1.4054412841796875, 1.46710205078125, 1.5287628173828125, 1.590423583984375, 1.6520843505859375, 1.7137451171875, 1.7754058837890625, 1.837066650390625, 1.8987274169921875, 1.96038818359375, 2.0220489501953125, 2.083709716796875, 2.1453704833984375, 2.20703125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 15.0, 16.0, 29.0, 37.0, 38.0, 54.0, 86.0, 111.0, 167.0, 237.0, 386.0, 562.0, 900.0, 1435.0, 2421.0, 4320.0, 8164.0, 16082.0, 37164.0, 108040.0, 194094.0, 86599.0, 31541.0, 14412.0, 7271.0, 4041.0, 2272.0, 1291.0, 792.0, 524.0, 330.0, 243.0, 169.0, 113.0, 77.0, 62.0, 36.0, 25.0, 19.0, 17.0, 13.0, 11.0, 5.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.5, -23.719970703125, -22.93994140625, -22.159912109375, -21.3798828125, -20.599853515625, -19.81982421875, -19.039794921875, -18.259765625, -17.479736328125, -16.69970703125, -15.919677734375, -15.1396484375, -14.359619140625, -13.57958984375, -12.799560546875, -12.01953125, -11.239501953125, -10.45947265625, -9.679443359375, -8.8994140625, -8.119384765625, -7.33935546875, -6.559326171875, -5.779296875, -4.999267578125, -4.21923828125, -3.439208984375, -2.6591796875, -1.879150390625, -1.09912109375, -0.319091796875, 0.4609375, 1.240966796875, 2.02099609375, 2.801025390625, 3.5810546875, 4.361083984375, 5.14111328125, 5.921142578125, 6.701171875, 7.481201171875, 8.26123046875, 9.041259765625, 9.8212890625, 10.601318359375, 11.38134765625, 12.161376953125, 12.94140625, 13.721435546875, 14.50146484375, 15.281494140625, 16.0615234375, 16.841552734375, 17.62158203125, 18.401611328125, 19.181640625, 19.961669921875, 20.74169921875, 21.521728515625, 22.3017578125, 23.081787109375, 23.86181640625, 24.641845703125, 25.421875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 4.0, 7.0, 14.0, 19.0, 17.0, 21.0, 35.0, 28.0, 42.0, 37.0, 37.0, 50.0, 35.0, 58.0, 52.0, 49.0, 50.0, 46.0, 45.0, 50.0, 42.0, 50.0, 24.0, 31.0, 32.0, 18.0, 17.0, 10.0, 6.0, 16.0, 11.0, 6.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.431640625, -2.346435546875, -2.26123046875, -2.176025390625, -2.0908203125, -2.005615234375, -1.92041015625, -1.835205078125, -1.75, -1.664794921875, -1.57958984375, -1.494384765625, -1.4091796875, -1.323974609375, -1.23876953125, -1.153564453125, -1.068359375, -0.983154296875, -0.89794921875, -0.812744140625, -0.7275390625, -0.642333984375, -0.55712890625, -0.471923828125, -0.38671875, -0.301513671875, -0.21630859375, -0.131103515625, -0.0458984375, 0.039306640625, 0.12451171875, 0.209716796875, 0.294921875, 0.380126953125, 0.46533203125, 0.550537109375, 0.6357421875, 0.720947265625, 0.80615234375, 0.891357421875, 0.9765625, 1.061767578125, 1.14697265625, 1.232177734375, 1.3173828125, 1.402587890625, 1.48779296875, 1.572998046875, 1.658203125, 1.743408203125, 1.82861328125, 1.913818359375, 1.9990234375, 2.084228515625, 2.16943359375, 2.254638671875, 2.33984375, 2.425048828125, 2.51025390625, 2.595458984375, 2.6806640625, 2.765869140625, 2.85107421875, 2.936279296875, 3.021484375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 12.0, 5.0, 30.0, 39.0, 55.0, 73.0, 79.0, 64.0, 32.0, 25.0, 12.0, 8.0, 10.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.080479621887207, -10.668635368347168, -10.256791114807129, -9.84494686126709, -9.433103561401367, -9.021259307861328, -8.609415054321289, -8.19757080078125, -7.785726547241211, -7.373882293701172, -6.962038040161133, -6.550194263458252, -6.138350009918213, -5.726505756378174, -5.314661979675293, -4.902817726135254, -4.490973472595215, -4.079129219055176, -3.667285203933716, -3.255441188812256, -2.843596935272217, -2.4317526817321777, -2.0199086666107178, -1.6080646514892578, -1.1962203979492188, -0.7843762636184692, -0.3725321292877197, 0.039312005043029785, 0.4511561393737793, 0.8630003929138184, 1.2748444080352783, 1.6866884231567383, 2.098531723022461, 2.5103759765625, 2.92221999168396, 3.33406400680542, 3.745908260345459, 4.157752513885498, 4.569596290588379, 4.981440544128418, 5.393284797668457, 5.805129051208496, 6.216973304748535, 6.628817081451416, 7.040661334991455, 7.452505588531494, 7.864349365234375, 8.276193618774414, 8.688037872314453, 9.099882125854492, 9.511726379394531, 9.92357063293457, 10.33541488647461, 10.747259140014648, 11.159102439880371, 11.57094669342041, 11.98279094696045, 12.394635200500488, 12.806479454040527, 13.218323707580566, 13.630167007446289, 14.042011260986328, 14.453855514526367, 14.865699768066406, 15.277544021606445]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 5.0, 9.0, 9.0, 11.0, 13.0, 12.0, 22.0, 40.0, 91.0, 116.0, 35.0, 21.0, 16.0, 10.0, 7.0, 14.0, 11.0, 4.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.910449981689453, -11.47547721862793, -11.040504455566406, -10.605531692504883, -10.17055892944336, -9.735586166381836, -9.300613403320312, -8.865640640258789, -8.430667877197266, -7.995695114135742, -7.560722351074219, -7.125749588012695, -6.690776824951172, -6.255804061889648, -5.820830821990967, -5.385858058929443, -4.950884819030762, -4.515912055969238, -4.080939292907715, -3.6459662914276123, -3.210993528366089, -2.7760207653045654, -2.341047763824463, -1.9060750007629395, -1.471102237701416, -1.0361294746398926, -0.6011565923690796, -0.1661837100982666, 0.26878905296325684, 0.7037618160247803, 1.1387348175048828, 1.5737075805664062, 2.0086793899536133, 2.4436521530151367, 2.87862491607666, 3.3135979175567627, 3.748570680618286, 4.1835432052612305, 4.618516445159912, 5.0534892082214355, 5.488461971282959, 5.923434734344482, 6.358407497406006, 6.7933807373046875, 7.228353500366211, 7.663326263427734, 8.098299026489258, 8.533271789550781, 8.968244552612305, 9.403217315673828, 9.838190078735352, 10.273162841796875, 10.708135604858398, 11.143108367919922, 11.578081130981445, 12.013053894042969, 12.448026657104492, 12.882999420166016, 13.317972183227539, 13.752944946289062, 14.187917709350586, 14.62289047241211, 15.057863235473633, 15.492835998535156, 15.927809715270996]}, "eval/loss": 1.642454743385315, "eval/bleu": 2.691896075803751e-15, "eval/runtime": 2632.4174, "eval/samples_per_second": 5.607, "eval/steps_per_second": 0.701, "train/train_runtime": 95217.2299, "train/train_samples_per_second": 6.534, "train/train_steps_per_second": 0.102, "train/total_flos": 0.0, "train/train_loss": 1.7970677693255643, "_wandb": {"runtime": 95577}} \ No newline at end of file