diff --git "a/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" "b/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220324_170220-1u8cita3/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 0.3575, "train/learning_rate": 6.0676056338028176e-06, "train/epoch": 20.18, "train/global_step": 18000, "_runtime": 10029, "_timestamp": 1648151369, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 4.0, 9.0, 13.0, 11.0, 7.0, 16.0, 20.0, 10.0, 23.0, 18.0, 25.0, 20.0, 23.0, 25.0, 29.0, 26.0, 24.0, 35.0, 39.0, 32.0, 44.0, 37.0, 37.0, 36.0, 35.0, 33.0, 31.0, 30.0, 42.0, 20.0, 20.0, 26.0, 22.0, 21.0, 17.0, 17.0, 15.0, 15.0, 12.0, 13.0, 11.0, 8.0, 8.0, 5.0, 0.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0], "bins": [-5.804027557373047, -5.677530765533447, -5.551033973693848, -5.424537658691406, -5.298040866851807, -5.171544075012207, -5.045047283172607, -4.918550491333008, -4.792053699493408, -4.665556907653809, -4.539060115814209, -4.412563323974609, -4.286067008972168, -4.159570217132568, -4.033073425292969, -3.906576633453369, -3.7800800800323486, -3.653583288192749, -3.5270867347717285, -3.400589942932129, -3.2740931510925293, -3.1475963592529297, -3.021099805831909, -2.8946030139923096, -2.768106460571289, -2.6416096687316895, -2.515113115310669, -2.3886163234710693, -2.2621195316314697, -2.135622978210449, -2.0091261863708496, -1.88262939453125, -1.7561326026916504, -1.6296359300613403, -1.5031391382217407, -1.3766424655914307, -1.250145673751831, -1.123649001121521, -0.9971523284912109, -0.8706555962562561, -0.7441588640213013, -0.6176621317863464, -0.491165429353714, -0.36466872692108154, -0.2381719946861267, -0.11167526245117188, 0.014821410179138184, 0.14131814241409302, 0.26781487464904785, 0.3943116068840027, 0.5208083391189575, 0.6473050117492676, 0.7738017439842224, 0.9002984762191772, 1.0267951488494873, 1.153291940689087, 1.279788613319397, 1.406285285949707, 1.5327820777893066, 1.6592787504196167, 1.7857754230499268, 1.9122722148895264, 2.038768768310547, 2.1652655601501465, 2.291762351989746]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 8.0, 9.0, 5.0, 6.0, 9.0, 9.0, 12.0, 12.0, 24.0, 28.0, 22.0, 25.0, 27.0, 38.0, 26.0, 33.0, 35.0, 40.0, 35.0, 33.0, 44.0, 41.0, 40.0, 43.0, 39.0, 32.0, 46.0, 36.0, 37.0, 25.0, 34.0, 25.0, 18.0, 22.0, 16.0, 14.0, 11.0, 10.0, 4.0, 4.0, 1.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.996482849121094, -4.8410186767578125, -4.685554027557373, -4.530089855194092, -4.3746256828308105, -4.219161033630371, -4.06369686126709, -3.9082326889038086, -3.7527682781219482, -3.597303867340088, -3.4418396949768066, -3.2863752841949463, -3.130910873413086, -2.9754467010498047, -2.8199822902679443, -2.664517879486084, -2.5090537071228027, -2.3535892963409424, -2.198125123977661, -2.042660713195801, -1.88719642162323, -1.7317321300506592, -1.5762677192687988, -1.420803427696228, -1.2653391361236572, -1.1098748445510864, -0.9544104933738708, -0.7989461421966553, -0.6434818506240845, -0.48801755905151367, -0.3325532078742981, -0.17708885669708252, -0.02162456512451172, 0.13383975625038147, 0.28930407762527466, 0.44476839900016785, 0.600232720375061, 0.7556970119476318, 0.9111613631248474, 1.066625714302063, 1.2220900058746338, 1.3775542974472046, 1.5330185890197754, 1.6884829998016357, 1.8439472913742065, 1.9994115829467773, 2.1548759937286377, 2.310340404510498, 2.4658045768737793, 2.6212689876556396, 2.776733160018921, 2.9321975708007812, 3.0876617431640625, 3.243126153945923, 3.398590564727783, 3.5540547370910645, 3.709519147872925, 3.864983558654785, 4.020447731018066, 4.175911903381348, 4.331376552581787, 4.486840724945068, 4.64230489730835, 4.797769546508789, 4.95323371887207]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 18.0, 15.0, 37.0, 65.0, 78.0, 140.0, 291.0, 512.0, 889.0, 1796.0, 3329.0, 6334.0, 11740.0, 21683.0, 40497.0, 74106.0, 135479.0, 238646.0, 402749.0, 612553.0, 755698.0, 696497.0, 496211.0, 305033.0, 176310.0, 97694.0, 53623.0, 28979.0, 15399.0, 8348.0, 4432.0, 2349.0, 1271.0, 663.0, 345.0, 203.0, 127.0, 58.0, 43.0, 16.0, 16.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.125, -7.88409423828125, -7.6431884765625, -7.40228271484375, -7.161376953125, -6.92047119140625, -6.6795654296875, -6.43865966796875, -6.19775390625, -5.95684814453125, -5.7159423828125, -5.47503662109375, -5.234130859375, -4.99322509765625, -4.7523193359375, -4.51141357421875, -4.2705078125, -4.02960205078125, -3.7886962890625, -3.54779052734375, -3.306884765625, -3.06597900390625, -2.8250732421875, -2.58416748046875, -2.34326171875, -2.10235595703125, -1.8614501953125, -1.62054443359375, -1.379638671875, -1.13873291015625, -0.8978271484375, -0.65692138671875, -0.416015625, -0.17510986328125, 0.0657958984375, 0.30670166015625, 0.547607421875, 0.78851318359375, 1.0294189453125, 1.27032470703125, 1.51123046875, 1.75213623046875, 1.9930419921875, 2.23394775390625, 2.474853515625, 2.71575927734375, 2.9566650390625, 3.19757080078125, 3.4384765625, 3.67938232421875, 3.9202880859375, 4.16119384765625, 4.402099609375, 4.64300537109375, 4.8839111328125, 5.12481689453125, 5.36572265625, 5.60662841796875, 5.8475341796875, 6.08843994140625, 6.329345703125, 6.57025146484375, 6.8111572265625, 7.05206298828125, 7.29296875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 5.0, 7.0, 11.0, 7.0, 12.0, 15.0, 18.0, 13.0, 27.0, 28.0, 25.0, 28.0, 30.0, 35.0, 41.0, 36.0, 31.0, 47.0, 37.0, 36.0, 39.0, 48.0, 40.0, 37.0, 32.0, 35.0, 38.0, 37.0, 33.0, 18.0, 21.0, 18.0, 15.0, 22.0, 10.0, 7.0, 7.0, 13.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.25390625, -5.09320068359375, -4.9324951171875, -4.77178955078125, -4.611083984375, -4.45037841796875, -4.2896728515625, -4.12896728515625, -3.96826171875, -3.80755615234375, -3.6468505859375, -3.48614501953125, -3.325439453125, -3.16473388671875, -3.0040283203125, -2.84332275390625, -2.6826171875, -2.52191162109375, -2.3612060546875, -2.20050048828125, -2.039794921875, -1.87908935546875, -1.7183837890625, -1.55767822265625, -1.39697265625, -1.23626708984375, -1.0755615234375, -0.91485595703125, -0.754150390625, -0.59344482421875, -0.4327392578125, -0.27203369140625, -0.111328125, 0.04937744140625, 0.2100830078125, 0.37078857421875, 0.531494140625, 0.69219970703125, 0.8529052734375, 1.01361083984375, 1.17431640625, 1.33502197265625, 1.4957275390625, 1.65643310546875, 1.817138671875, 1.97784423828125, 2.1385498046875, 2.29925537109375, 2.4599609375, 2.62066650390625, 2.7813720703125, 2.94207763671875, 3.102783203125, 3.26348876953125, 3.4241943359375, 3.58489990234375, 3.74560546875, 3.90631103515625, 4.0670166015625, 4.22772216796875, 4.388427734375, 4.54913330078125, 4.7098388671875, 4.87054443359375, 5.03125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 7.0, 4.0, 7.0, 20.0, 24.0, 44.0, 76.0, 126.0, 216.0, 374.0, 672.0, 1182.0, 2078.0, 3602.0, 6127.0, 10894.0, 18600.0, 32425.0, 56430.0, 94456.0, 156533.0, 249803.0, 374700.0, 514612.0, 616470.0, 608615.0, 497588.0, 355256.0, 235407.0, 146647.0, 88147.0, 52043.0, 30056.0, 17455.0, 10149.0, 5580.0, 3308.0, 1872.0, 1166.0, 664.0, 354.0, 220.0, 110.0, 78.0, 53.0, 18.0, 13.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.069580078125, -4.88134765625, -4.693115234375, -4.5048828125, -4.316650390625, -4.12841796875, -3.940185546875, -3.751953125, -3.563720703125, -3.37548828125, -3.187255859375, -2.9990234375, -2.810791015625, -2.62255859375, -2.434326171875, -2.24609375, -2.057861328125, -1.86962890625, -1.681396484375, -1.4931640625, -1.304931640625, -1.11669921875, -0.928466796875, -0.740234375, -0.552001953125, -0.36376953125, -0.175537109375, 0.0126953125, 0.200927734375, 0.38916015625, 0.577392578125, 0.765625, 0.953857421875, 1.14208984375, 1.330322265625, 1.5185546875, 1.706787109375, 1.89501953125, 2.083251953125, 2.271484375, 2.459716796875, 2.64794921875, 2.836181640625, 3.0244140625, 3.212646484375, 3.40087890625, 3.589111328125, 3.77734375, 3.965576171875, 4.15380859375, 4.342041015625, 4.5302734375, 4.718505859375, 4.90673828125, 5.094970703125, 5.283203125, 5.471435546875, 5.65966796875, 5.847900390625, 6.0361328125, 6.224365234375, 6.41259765625, 6.600830078125, 6.7890625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 11.0, 14.0, 14.0, 17.0, 26.0, 27.0, 38.0, 58.0, 47.0, 86.0, 87.0, 102.0, 108.0, 157.0, 165.0, 186.0, 210.0, 227.0, 229.0, 245.0, 222.0, 226.0, 208.0, 228.0, 178.0, 149.0, 153.0, 106.0, 98.0, 95.0, 74.0, 48.0, 46.0, 43.0, 31.0, 23.0, 25.0, 14.0, 12.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.609375, -2.52978515625, -2.4501953125, -2.37060546875, -2.291015625, -2.21142578125, -2.1318359375, -2.05224609375, -1.97265625, -1.89306640625, -1.8134765625, -1.73388671875, -1.654296875, -1.57470703125, -1.4951171875, -1.41552734375, -1.3359375, -1.25634765625, -1.1767578125, -1.09716796875, -1.017578125, -0.93798828125, -0.8583984375, -0.77880859375, -0.69921875, -0.61962890625, -0.5400390625, -0.46044921875, -0.380859375, -0.30126953125, -0.2216796875, -0.14208984375, -0.0625, 0.01708984375, 0.0966796875, 0.17626953125, 0.255859375, 0.33544921875, 0.4150390625, 0.49462890625, 0.57421875, 0.65380859375, 0.7333984375, 0.81298828125, 0.892578125, 0.97216796875, 1.0517578125, 1.13134765625, 1.2109375, 1.29052734375, 1.3701171875, 1.44970703125, 1.529296875, 1.60888671875, 1.6884765625, 1.76806640625, 1.84765625, 1.92724609375, 2.0068359375, 2.08642578125, 2.166015625, 2.24560546875, 2.3251953125, 2.40478515625, 2.484375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 8.0, 7.0, 16.0, 16.0, 25.0, 22.0, 25.0, 30.0, 31.0, 27.0, 30.0, 31.0, 41.0, 39.0, 42.0, 54.0, 48.0, 45.0, 43.0, 38.0, 37.0, 47.0, 41.0, 29.0, 31.0, 21.0, 20.0, 20.0, 19.0, 18.0, 11.0, 12.0, 5.0, 10.0, 5.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.882208824157715, -5.70045280456543, -5.518697261810303, -5.336941242218018, -5.155185222625732, -4.9734296798706055, -4.79167366027832, -4.609917640686035, -4.42816162109375, -4.246405601501465, -4.064650058746338, -3.8828940391540527, -3.7011380195617676, -3.5193822383880615, -3.3376264572143555, -3.1558704376220703, -2.9741148948669434, -2.7923591136932373, -2.610603094100952, -2.428847312927246, -2.247091293334961, -2.065335512161255, -1.8835797309875488, -1.7018238306045532, -1.5200679302215576, -1.338312029838562, -1.1565561294555664, -0.9748003482818604, -0.7930444478988647, -0.6112885475158691, -0.4295327663421631, -0.24777686595916748, -0.06602096557617188, 0.11573490500450134, 0.29749077558517456, 0.4792466163635254, 0.661002516746521, 0.8427584171295166, 1.0245141983032227, 1.2062700986862183, 1.3880259990692139, 1.5697818994522095, 1.751537799835205, 1.9332935810089111, 2.115049362182617, 2.2968053817749023, 2.4785611629486084, 2.6603169441223145, 2.8420729637145996, 3.0238287448883057, 3.205584764480591, 3.387340545654297, 3.569096565246582, 3.750852346420288, 3.932608127593994, 4.114364147186279, 4.296119689941406, 4.477875709533691, 4.659631252288818, 4.8413872718811035, 5.023143291473389, 5.204898834228516, 5.386654853820801, 5.568410873413086, 5.750166893005371]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 6.0, 10.0, 12.0, 13.0, 13.0, 15.0, 15.0, 21.0, 20.0, 20.0, 24.0, 18.0, 40.0, 30.0, 30.0, 35.0, 49.0, 38.0, 50.0, 52.0, 39.0, 38.0, 36.0, 36.0, 34.0, 37.0, 35.0, 30.0, 34.0, 20.0, 23.0, 19.0, 18.0, 15.0, 11.0, 10.0, 7.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.798727035522461, -5.615190029144287, -5.431652545928955, -5.248115539550781, -5.064578056335449, -4.881041049957275, -4.697504043579102, -4.5139665603637695, -4.330429553985596, -4.146892547607422, -3.96335506439209, -3.779818058013916, -3.596280813217163, -3.41274356842041, -3.2292063236236572, -3.0456690788269043, -2.8621318340301514, -2.6785945892333984, -2.4950573444366455, -2.3115200996398926, -2.1279830932617188, -1.9444458484649658, -1.760908603668213, -1.5773714780807495, -1.3938342332839966, -1.2102969884872437, -1.0267598628997803, -0.8432226181030273, -0.6596854329109192, -0.47614824771881104, -0.2926110029220581, -0.10907387733459473, 0.0744633674621582, 0.25800055265426636, 0.4415377676486969, 0.6250749826431274, 0.8086121678352356, 0.9921493530273438, 1.1756865978240967, 1.35922372341156, 1.542760968208313, 1.726298213005066, 1.9098353385925293, 2.0933725833892822, 2.276909828186035, 2.460446834564209, 2.643984317779541, 2.827521324157715, 3.0110585689544678, 3.1945958137512207, 3.3781330585479736, 3.5616703033447266, 3.7452073097229004, 3.9287445545196533, 4.112281799316406, 4.29581880569458, 4.479356288909912, 4.662893295288086, 4.846430778503418, 5.029967784881592, 5.213505268096924, 5.397042274475098, 5.58057975769043, 5.7641167640686035, 5.947653770446777]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 1.0, 6.0, 7.0, 8.0, 12.0, 29.0, 21.0, 38.0, 53.0, 64.0, 87.0, 143.0, 208.0, 268.0, 380.0, 576.0, 892.0, 1381.0, 2050.0, 3430.0, 5639.0, 9601.0, 16747.0, 29856.0, 53100.0, 92977.0, 151356.0, 201810.0, 184069.0, 123881.0, 73034.0, 40806.0, 23062.0, 13089.0, 7383.0, 4487.0, 2651.0, 1809.0, 1138.0, 729.0, 530.0, 337.0, 236.0, 166.0, 122.0, 93.0, 53.0, 52.0, 32.0, 16.0, 15.0, 11.0, 8.0, 5.0, 3.0, 3.0], "bins": [-3.1171875, -3.030059814453125, -2.94293212890625, -2.855804443359375, -2.7686767578125, -2.681549072265625, -2.59442138671875, -2.507293701171875, -2.420166015625, -2.333038330078125, -2.24591064453125, -2.158782958984375, -2.0716552734375, -1.984527587890625, -1.89739990234375, -1.810272216796875, -1.72314453125, -1.636016845703125, -1.54888916015625, -1.461761474609375, -1.3746337890625, -1.287506103515625, -1.20037841796875, -1.113250732421875, -1.026123046875, -0.938995361328125, -0.85186767578125, -0.764739990234375, -0.6776123046875, -0.590484619140625, -0.50335693359375, -0.416229248046875, -0.3291015625, -0.241973876953125, -0.15484619140625, -0.067718505859375, 0.0194091796875, 0.106536865234375, 0.19366455078125, 0.280792236328125, 0.367919921875, 0.455047607421875, 0.54217529296875, 0.629302978515625, 0.7164306640625, 0.803558349609375, 0.89068603515625, 0.977813720703125, 1.06494140625, 1.152069091796875, 1.23919677734375, 1.326324462890625, 1.4134521484375, 1.500579833984375, 1.58770751953125, 1.674835205078125, 1.761962890625, 1.849090576171875, 1.93621826171875, 2.023345947265625, 2.1104736328125, 2.197601318359375, 2.28472900390625, 2.371856689453125, 2.458984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 5.0, 11.0, 9.0, 11.0, 11.0, 9.0, 10.0, 11.0, 18.0, 20.0, 22.0, 33.0, 22.0, 33.0, 28.0, 21.0, 36.0, 46.0, 32.0, 35.0, 27.0, 37.0, 51.0, 55.0, 36.0, 41.0, 29.0, 32.0, 32.0, 31.0, 22.0, 20.0, 24.0, 20.0, 18.0, 18.0, 12.0, 17.0, 5.0, 9.0, 10.0, 5.0, 6.0, 3.0, 6.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.72265625, -5.54058837890625, -5.3585205078125, -5.17645263671875, -4.994384765625, -4.81231689453125, -4.6302490234375, -4.44818115234375, -4.26611328125, -4.08404541015625, -3.9019775390625, -3.71990966796875, -3.537841796875, -3.35577392578125, -3.1737060546875, -2.99163818359375, -2.8095703125, -2.62750244140625, -2.4454345703125, -2.26336669921875, -2.081298828125, -1.89923095703125, -1.7171630859375, -1.53509521484375, -1.35302734375, -1.17095947265625, -0.9888916015625, -0.80682373046875, -0.624755859375, -0.44268798828125, -0.2606201171875, -0.07855224609375, 0.103515625, 0.28558349609375, 0.4676513671875, 0.64971923828125, 0.831787109375, 1.01385498046875, 1.1959228515625, 1.37799072265625, 1.56005859375, 1.74212646484375, 1.9241943359375, 2.10626220703125, 2.288330078125, 2.47039794921875, 2.6524658203125, 2.83453369140625, 3.0166015625, 3.19866943359375, 3.3807373046875, 3.56280517578125, 3.744873046875, 3.92694091796875, 4.1090087890625, 4.29107666015625, 4.47314453125, 4.65521240234375, 4.8372802734375, 5.01934814453125, 5.201416015625, 5.38348388671875, 5.5655517578125, 5.74761962890625, 5.9296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 7.0, 9.0, 9.0, 24.0, 25.0, 35.0, 54.0, 67.0, 149.0, 220.0, 452.0, 927.0, 2061.0, 5950.0, 20037.0, 233862.0, 747029.0, 25793.0, 7005.0, 2552.0, 1075.0, 525.0, 264.0, 124.0, 76.0, 59.0, 40.0, 25.0, 29.0, 15.0, 11.0, 9.0, 10.0, 4.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.5672607421875, -9.259521484375, -8.9517822265625, -8.64404296875, -8.3363037109375, -8.028564453125, -7.7208251953125, -7.4130859375, -7.1053466796875, -6.797607421875, -6.4898681640625, -6.18212890625, -5.8743896484375, -5.566650390625, -5.2589111328125, -4.951171875, -4.6434326171875, -4.335693359375, -4.0279541015625, -3.72021484375, -3.4124755859375, -3.104736328125, -2.7969970703125, -2.4892578125, -2.1815185546875, -1.873779296875, -1.5660400390625, -1.25830078125, -0.9505615234375, -0.642822265625, -0.3350830078125, -0.02734375, 0.2803955078125, 0.588134765625, 0.8958740234375, 1.20361328125, 1.5113525390625, 1.819091796875, 2.1268310546875, 2.4345703125, 2.7423095703125, 3.050048828125, 3.3577880859375, 3.66552734375, 3.9732666015625, 4.281005859375, 4.5887451171875, 4.896484375, 5.2042236328125, 5.511962890625, 5.8197021484375, 6.12744140625, 6.4351806640625, 6.742919921875, 7.0506591796875, 7.3583984375, 7.6661376953125, 7.973876953125, 8.2816162109375, 8.58935546875, 8.8970947265625, 9.204833984375, 9.5125732421875, 9.8203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 3.0, 6.0, 10.0, 9.0, 10.0, 9.0, 15.0, 22.0, 24.0, 26.0, 18.0, 40.0, 33.0, 32.0, 49.0, 27.0, 42.0, 40.0, 36.0, 47.0, 38.0, 36.0, 36.0, 33.0, 28.0, 34.0, 30.0, 28.0, 28.0, 24.0, 31.0, 22.0, 19.0, 24.0, 22.0, 8.0, 9.0, 9.0, 7.0, 8.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-4.7421875, -4.6048583984375, -4.467529296875, -4.3302001953125, -4.19287109375, -4.0555419921875, -3.918212890625, -3.7808837890625, -3.6435546875, -3.5062255859375, -3.368896484375, -3.2315673828125, -3.09423828125, -2.9569091796875, -2.819580078125, -2.6822509765625, -2.544921875, -2.4075927734375, -2.270263671875, -2.1329345703125, -1.99560546875, -1.8582763671875, -1.720947265625, -1.5836181640625, -1.4462890625, -1.3089599609375, -1.171630859375, -1.0343017578125, -0.89697265625, -0.7596435546875, -0.622314453125, -0.4849853515625, -0.34765625, -0.2103271484375, -0.072998046875, 0.0643310546875, 0.20166015625, 0.3389892578125, 0.476318359375, 0.6136474609375, 0.7509765625, 0.8883056640625, 1.025634765625, 1.1629638671875, 1.30029296875, 1.4376220703125, 1.574951171875, 1.7122802734375, 1.849609375, 1.9869384765625, 2.124267578125, 2.2615966796875, 2.39892578125, 2.5362548828125, 2.673583984375, 2.8109130859375, 2.9482421875, 3.0855712890625, 3.222900390625, 3.3602294921875, 3.49755859375, 3.6348876953125, 3.772216796875, 3.9095458984375, 4.046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 13.0, 7.0, 10.0, 15.0, 33.0, 28.0, 36.0, 52.0, 58.0, 107.0, 141.0, 202.0, 320.0, 450.0, 808.0, 1372.0, 2647.0, 5488.0, 12776.0, 37830.0, 833697.0, 114640.0, 21052.0, 8142.0, 3769.0, 1917.0, 1051.0, 614.0, 365.0, 254.0, 153.0, 118.0, 99.0, 67.0, 46.0, 33.0, 27.0, 24.0, 21.0, 17.0, 13.0, 8.0, 11.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.154296875, -1.1179351806640625, -1.081573486328125, -1.0452117919921875, -1.00885009765625, -0.9724884033203125, -0.936126708984375, -0.8997650146484375, -0.8634033203125, -0.8270416259765625, -0.790679931640625, -0.7543182373046875, -0.71795654296875, -0.6815948486328125, -0.645233154296875, -0.6088714599609375, -0.572509765625, -0.5361480712890625, -0.499786376953125, -0.4634246826171875, -0.42706298828125, -0.3907012939453125, -0.354339599609375, -0.3179779052734375, -0.2816162109375, -0.2452545166015625, -0.208892822265625, -0.1725311279296875, -0.13616943359375, -0.0998077392578125, -0.063446044921875, -0.0270843505859375, 0.00927734375, 0.0456390380859375, 0.082000732421875, 0.1183624267578125, 0.15472412109375, 0.1910858154296875, 0.227447509765625, 0.2638092041015625, 0.3001708984375, 0.3365325927734375, 0.372894287109375, 0.4092559814453125, 0.44561767578125, 0.4819793701171875, 0.518341064453125, 0.5547027587890625, 0.591064453125, 0.6274261474609375, 0.663787841796875, 0.7001495361328125, 0.73651123046875, 0.7728729248046875, 0.809234619140625, 0.8455963134765625, 0.8819580078125, 0.9183197021484375, 0.954681396484375, 0.9910430908203125, 1.02740478515625, 1.0637664794921875, 1.100128173828125, 1.1364898681640625, 1.1728515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 5.0, 13.0, 16.0, 15.0, 22.0, 25.0, 43.0, 52.0, 67.0, 73.0, 78.0, 100.0, 85.0, 65.0, 66.0, 63.0, 55.0, 36.0, 27.0, 17.0, 13.0, 15.0, 5.0, 10.0, 7.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.273124694824219e-05, -8.015520870685577e-05, -7.757917046546936e-05, -7.500313222408295e-05, -7.242709398269653e-05, -6.985105574131012e-05, -6.72750174999237e-05, -6.469897925853729e-05, -6.212294101715088e-05, -5.9546902775764465e-05, -5.697086453437805e-05, -5.439482629299164e-05, -5.1818788051605225e-05, -4.924274981021881e-05, -4.66667115688324e-05, -4.4090673327445984e-05, -4.151463508605957e-05, -3.893859684467316e-05, -3.636255860328674e-05, -3.378652036190033e-05, -3.1210482120513916e-05, -2.8634443879127502e-05, -2.605840563774109e-05, -2.3482367396354675e-05, -2.0906329154968262e-05, -1.8330290913581848e-05, -1.5754252672195435e-05, -1.3178214430809021e-05, -1.0602176189422607e-05, -8.026137948036194e-06, -5.45009970664978e-06, -2.8740614652633667e-06, -2.980232238769531e-07, 2.2780150175094604e-06, 4.854053258895874e-06, 7.430091500282288e-06, 1.0006129741668701e-05, 1.2582167983055115e-05, 1.5158206224441528e-05, 1.7734244465827942e-05, 2.0310282707214355e-05, 2.288632094860077e-05, 2.5462359189987183e-05, 2.8038397431373596e-05, 3.061443567276001e-05, 3.319047391414642e-05, 3.576651215553284e-05, 3.834255039691925e-05, 4.0918588638305664e-05, 4.349462687969208e-05, 4.607066512107849e-05, 4.8646703362464905e-05, 5.122274160385132e-05, 5.379877984523773e-05, 5.6374818086624146e-05, 5.895085632801056e-05, 6.152689456939697e-05, 6.410293281078339e-05, 6.66789710521698e-05, 6.925500929355621e-05, 7.183104753494263e-05, 7.440708577632904e-05, 7.698312401771545e-05, 7.955916225910187e-05, 8.213520050048828e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 17.0, 20.0, 47.0, 56.0, 100.0, 143.0, 182.0, 281.0, 394.0, 598.0, 932.0, 1282.0, 2011.0, 3150.0, 5058.0, 8464.0, 15412.0, 30400.0, 64613.0, 139100.0, 267475.0, 254633.0, 129705.0, 59658.0, 28346.0, 14593.0, 8099.0, 4871.0, 3007.0, 1941.0, 1340.0, 811.0, 539.0, 394.0, 306.0, 177.0, 123.0, 86.0, 59.0, 41.0, 25.0, 20.0, 16.0, 9.0, 8.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.111328125, -1.0754241943359375, -1.039520263671875, -1.0036163330078125, -0.96771240234375, -0.9318084716796875, -0.895904541015625, -0.8600006103515625, -0.8240966796875, -0.7881927490234375, -0.752288818359375, -0.7163848876953125, -0.68048095703125, -0.6445770263671875, -0.608673095703125, -0.5727691650390625, -0.536865234375, -0.5009613037109375, -0.465057373046875, -0.4291534423828125, -0.39324951171875, -0.3573455810546875, -0.321441650390625, -0.2855377197265625, -0.2496337890625, -0.2137298583984375, -0.177825927734375, -0.1419219970703125, -0.10601806640625, -0.0701141357421875, -0.034210205078125, 0.0016937255859375, 0.03759765625, 0.0735015869140625, 0.109405517578125, 0.1453094482421875, 0.18121337890625, 0.2171173095703125, 0.253021240234375, 0.2889251708984375, 0.3248291015625, 0.3607330322265625, 0.396636962890625, 0.4325408935546875, 0.46844482421875, 0.5043487548828125, 0.540252685546875, 0.5761566162109375, 0.612060546875, 0.6479644775390625, 0.683868408203125, 0.7197723388671875, 0.75567626953125, 0.7915802001953125, 0.827484130859375, 0.8633880615234375, 0.8992919921875, 0.9351959228515625, 0.971099853515625, 1.0070037841796875, 1.04290771484375, 1.0788116455078125, 1.114715576171875, 1.1506195068359375, 1.1865234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 8.0, 6.0, 23.0, 10.0, 22.0, 17.0, 34.0, 33.0, 43.0, 54.0, 74.0, 114.0, 111.0, 90.0, 73.0, 51.0, 37.0, 43.0, 31.0, 18.0, 20.0, 22.0, 10.0, 7.0, 13.0, 7.0, 3.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47216796875, -0.4589118957519531, -0.44565582275390625, -0.4323997497558594, -0.4191436767578125, -0.4058876037597656, -0.39263153076171875, -0.3793754577636719, -0.366119384765625, -0.3528633117675781, -0.33960723876953125, -0.3263511657714844, -0.3130950927734375, -0.2998390197753906, -0.28658294677734375, -0.2733268737792969, -0.26007080078125, -0.24681472778320312, -0.23355865478515625, -0.22030258178710938, -0.2070465087890625, -0.19379043579101562, -0.18053436279296875, -0.16727828979492188, -0.154022216796875, -0.14076614379882812, -0.12751007080078125, -0.11425399780273438, -0.1009979248046875, -0.08774185180664062, -0.07448577880859375, -0.061229705810546875, -0.0479736328125, -0.034717559814453125, -0.02146148681640625, -0.008205413818359375, 0.0050506591796875, 0.018306732177734375, 0.03156280517578125, 0.044818878173828125, 0.058074951171875, 0.07133102416992188, 0.08458709716796875, 0.09784317016601562, 0.1110992431640625, 0.12435531616210938, 0.13761138916015625, 0.15086746215820312, 0.16412353515625, 0.17737960815429688, 0.19063568115234375, 0.20389175415039062, 0.2171478271484375, 0.23040390014648438, 0.24365997314453125, 0.2569160461425781, 0.270172119140625, 0.2834281921386719, 0.29668426513671875, 0.3099403381347656, 0.3231964111328125, 0.3364524841308594, 0.34970855712890625, 0.3629646301269531, 0.376220703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 6.0, 9.0, 7.0, 5.0, 11.0, 11.0, 12.0, 9.0, 21.0, 27.0, 32.0, 25.0, 19.0, 27.0, 28.0, 23.0, 28.0, 44.0, 39.0, 43.0, 53.0, 31.0, 53.0, 37.0, 34.0, 39.0, 37.0, 37.0, 34.0, 29.0, 30.0, 17.0, 19.0, 16.0, 18.0, 13.0, 16.0, 9.0, 6.0, 6.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-5.38533353805542, -5.218801498413086, -5.05226993560791, -4.885737895965576, -4.719205856323242, -4.552674293518066, -4.386142253875732, -4.219610214233398, -4.053078651428223, -3.8865468502044678, -3.720014810562134, -3.553483009338379, -3.386950969696045, -3.22041916847229, -3.053887367248535, -2.887355327606201, -2.720823287963867, -2.5542914867401123, -2.3877594470977783, -2.2212276458740234, -2.0546956062316895, -1.8881638050079346, -1.7216320037841797, -1.5551000833511353, -1.3885681629180908, -1.2220362424850464, -1.055504322052002, -0.8889725208282471, -0.7224406003952026, -0.5559086799621582, -0.38937681913375854, -0.2228449583053589, -0.056313514709472656, 0.11021837592124939, 0.27675026655197144, 0.4432821571826935, 0.6098140478134155, 0.77634596824646, 0.9428778290748596, 1.1094096899032593, 1.2759416103363037, 1.4424735307693481, 1.6090054512023926, 1.7755372524261475, 1.942069172859192, 2.1086010932922363, 2.275132894515991, 2.441664695739746, 2.60819673538208, 2.774728536605835, 2.941260576248169, 3.107792377471924, 3.274324417114258, 3.4408562183380127, 3.6073880195617676, 3.7739200592041016, 3.9404518604278564, 4.106983661651611, 4.273515701293945, 4.440047740936279, 4.606579303741455, 4.773111343383789, 4.939643383026123, 5.106174945831299, 5.272706985473633]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 6.0, 4.0, 8.0, 12.0, 8.0, 18.0, 11.0, 13.0, 14.0, 19.0, 21.0, 19.0, 22.0, 25.0, 33.0, 31.0, 37.0, 27.0, 41.0, 44.0, 46.0, 54.0, 39.0, 38.0, 44.0, 36.0, 35.0, 37.0, 31.0, 26.0, 35.0, 23.0, 25.0, 20.0, 14.0, 13.0, 16.0, 9.0, 7.0, 7.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.695402145385742, -5.515336036682129, -5.335269927978516, -5.155203819274902, -4.975137710571289, -4.795071601867676, -4.6150054931640625, -4.434938907623291, -4.254872798919678, -4.0748066902160645, -3.894740581512451, -3.714674472808838, -3.5346081256866455, -3.3545420169830322, -3.174475908279419, -2.9944095611572266, -2.8143436908721924, -2.634277582168579, -2.454211473464966, -2.2741451263427734, -2.09407901763916, -1.9140129089355469, -1.7339468002319336, -1.5538805723190308, -1.3738144636154175, -1.1937483549118042, -1.0136821269989014, -0.8336160182952881, -0.65354984998703, -0.473483681678772, -0.2934175729751587, -0.11335134506225586, 0.06671476364135742, 0.24678091704845428, 0.42684707045555115, 0.6069132089614868, 0.7869793772697449, 0.9670455455780029, 1.1471116542816162, 1.327177882194519, 1.5072439908981323, 1.6873100996017456, 1.8673763275146484, 2.0474424362182617, 2.227508544921875, 2.4075746536254883, 2.5876407623291016, 2.767707109451294, 2.9477732181549072, 3.1278393268585205, 3.307905435562134, 3.487971782684326, 3.6680378913879395, 3.8481040000915527, 4.028170108795166, 4.208236217498779, 4.388302326202393, 4.568368434906006, 4.748434543609619, 4.928500652313232, 5.108566761016846, 5.288633346557617, 5.4686994552612305, 5.648765563964844, 5.828831672668457]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 4.0, 3.0, 8.0, 10.0, 22.0, 35.0, 56.0, 84.0, 133.0, 205.0, 349.0, 530.0, 847.0, 1457.0, 2234.0, 3591.0, 5626.0, 8789.0, 13403.0, 20314.0, 29638.0, 41804.0, 56322.0, 73616.0, 88431.0, 101062.0, 106298.0, 103896.0, 93874.0, 80062.0, 63460.0, 48156.0, 34595.0, 23958.0, 16157.0, 10765.0, 6945.0, 4386.0, 2827.0, 1721.0, 1075.0, 693.0, 414.0, 262.0, 158.0, 108.0, 75.0, 37.0, 28.0, 10.0, 14.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.53125, -4.3787841796875, -4.226318359375, -4.0738525390625, -3.92138671875, -3.7689208984375, -3.616455078125, -3.4639892578125, -3.3115234375, -3.1590576171875, -3.006591796875, -2.8541259765625, -2.70166015625, -2.5491943359375, -2.396728515625, -2.2442626953125, -2.091796875, -1.9393310546875, -1.786865234375, -1.6343994140625, -1.48193359375, -1.3294677734375, -1.177001953125, -1.0245361328125, -0.8720703125, -0.7196044921875, -0.567138671875, -0.4146728515625, -0.26220703125, -0.1097412109375, 0.042724609375, 0.1951904296875, 0.34765625, 0.5001220703125, 0.652587890625, 0.8050537109375, 0.95751953125, 1.1099853515625, 1.262451171875, 1.4149169921875, 1.5673828125, 1.7198486328125, 1.872314453125, 2.0247802734375, 2.17724609375, 2.3297119140625, 2.482177734375, 2.6346435546875, 2.787109375, 2.9395751953125, 3.092041015625, 3.2445068359375, 3.39697265625, 3.5494384765625, 3.701904296875, 3.8543701171875, 4.0068359375, 4.1593017578125, 4.311767578125, 4.4642333984375, 4.61669921875, 4.7691650390625, 4.921630859375, 5.0740966796875, 5.2265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 12.0, 11.0, 13.0, 8.0, 11.0, 9.0, 14.0, 22.0, 21.0, 20.0, 27.0, 30.0, 26.0, 39.0, 31.0, 38.0, 42.0, 41.0, 53.0, 43.0, 49.0, 41.0, 33.0, 45.0, 31.0, 38.0, 40.0, 34.0, 28.0, 22.0, 25.0, 18.0, 15.0, 7.0, 11.0, 11.0, 9.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.1328125, -5.94329833984375, -5.7537841796875, -5.56427001953125, -5.374755859375, -5.18524169921875, -4.9957275390625, -4.80621337890625, -4.61669921875, -4.42718505859375, -4.2376708984375, -4.04815673828125, -3.858642578125, -3.66912841796875, -3.4796142578125, -3.29010009765625, -3.1005859375, -2.91107177734375, -2.7215576171875, -2.53204345703125, -2.342529296875, -2.15301513671875, -1.9635009765625, -1.77398681640625, -1.58447265625, -1.39495849609375, -1.2054443359375, -1.01593017578125, -0.826416015625, -0.63690185546875, -0.4473876953125, -0.25787353515625, -0.068359375, 0.12115478515625, 0.3106689453125, 0.50018310546875, 0.689697265625, 0.87921142578125, 1.0687255859375, 1.25823974609375, 1.44775390625, 1.63726806640625, 1.8267822265625, 2.01629638671875, 2.205810546875, 2.39532470703125, 2.5848388671875, 2.77435302734375, 2.9638671875, 3.15338134765625, 3.3428955078125, 3.53240966796875, 3.721923828125, 3.91143798828125, 4.1009521484375, 4.29046630859375, 4.47998046875, 4.66949462890625, 4.8590087890625, 5.04852294921875, 5.238037109375, 5.42755126953125, 5.6170654296875, 5.80657958984375, 5.99609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 3.0, 14.0, 18.0, 13.0, 36.0, 53.0, 90.0, 115.0, 236.0, 375.0, 606.0, 1026.0, 1643.0, 2726.0, 4623.0, 7714.0, 12721.0, 20095.0, 31174.0, 46786.0, 66415.0, 88100.0, 107343.0, 119757.0, 121088.0, 111352.0, 91983.0, 70800.0, 50141.0, 33930.0, 22237.0, 13791.0, 8664.0, 5189.0, 3067.0, 1858.0, 1060.0, 667.0, 417.0, 232.0, 158.0, 87.0, 56.0, 45.0, 22.0, 13.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.41796875, -7.200439453125, -6.98291015625, -6.765380859375, -6.5478515625, -6.330322265625, -6.11279296875, -5.895263671875, -5.677734375, -5.460205078125, -5.24267578125, -5.025146484375, -4.8076171875, -4.590087890625, -4.37255859375, -4.155029296875, -3.9375, -3.719970703125, -3.50244140625, -3.284912109375, -3.0673828125, -2.849853515625, -2.63232421875, -2.414794921875, -2.197265625, -1.979736328125, -1.76220703125, -1.544677734375, -1.3271484375, -1.109619140625, -0.89208984375, -0.674560546875, -0.45703125, -0.239501953125, -0.02197265625, 0.195556640625, 0.4130859375, 0.630615234375, 0.84814453125, 1.065673828125, 1.283203125, 1.500732421875, 1.71826171875, 1.935791015625, 2.1533203125, 2.370849609375, 2.58837890625, 2.805908203125, 3.0234375, 3.240966796875, 3.45849609375, 3.676025390625, 3.8935546875, 4.111083984375, 4.32861328125, 4.546142578125, 4.763671875, 4.981201171875, 5.19873046875, 5.416259765625, 5.6337890625, 5.851318359375, 6.06884765625, 6.286376953125, 6.50390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 4.0, 7.0, 12.0, 9.0, 13.0, 11.0, 14.0, 19.0, 28.0, 19.0, 15.0, 20.0, 30.0, 26.0, 37.0, 38.0, 34.0, 36.0, 39.0, 30.0, 38.0, 39.0, 36.0, 36.0, 29.0, 39.0, 31.0, 26.0, 27.0, 20.0, 24.0, 26.0, 23.0, 23.0, 18.0, 13.0, 20.0, 11.0, 12.0, 10.0, 6.0, 10.0, 7.0, 8.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-3.369140625, -3.263946533203125, -3.15875244140625, -3.053558349609375, -2.9483642578125, -2.843170166015625, -2.73797607421875, -2.632781982421875, -2.527587890625, -2.422393798828125, -2.31719970703125, -2.212005615234375, -2.1068115234375, -2.001617431640625, -1.89642333984375, -1.791229248046875, -1.68603515625, -1.580841064453125, -1.47564697265625, -1.370452880859375, -1.2652587890625, -1.160064697265625, -1.05487060546875, -0.949676513671875, -0.844482421875, -0.739288330078125, -0.63409423828125, -0.528900146484375, -0.4237060546875, -0.318511962890625, -0.21331787109375, -0.108123779296875, -0.0029296875, 0.102264404296875, 0.20745849609375, 0.312652587890625, 0.4178466796875, 0.523040771484375, 0.62823486328125, 0.733428955078125, 0.838623046875, 0.943817138671875, 1.04901123046875, 1.154205322265625, 1.2593994140625, 1.364593505859375, 1.46978759765625, 1.574981689453125, 1.68017578125, 1.785369873046875, 1.89056396484375, 1.995758056640625, 2.1009521484375, 2.206146240234375, 2.31134033203125, 2.416534423828125, 2.521728515625, 2.626922607421875, 2.73211669921875, 2.837310791015625, 2.9425048828125, 3.047698974609375, 3.15289306640625, 3.258087158203125, 3.36328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 23.0, 21.0, 37.0, 57.0, 89.0, 114.0, 166.0, 225.0, 363.0, 530.0, 813.0, 1196.0, 1837.0, 2862.0, 4217.0, 6560.0, 10116.0, 15597.0, 23270.0, 34569.0, 48738.0, 66514.0, 86508.0, 103681.0, 114227.0, 114397.0, 103877.0, 86681.0, 67596.0, 49578.0, 34918.0, 23346.0, 15655.0, 10453.0, 6763.0, 4455.0, 2876.0, 1800.0, 1262.0, 841.0, 557.0, 362.0, 255.0, 160.0, 145.0, 77.0, 40.0, 39.0, 33.0, 16.0, 9.0, 10.0, 11.0, 2.0, 1.0, 1.0], "bins": [-1.51953125, -1.4735107421875, -1.427490234375, -1.3814697265625, -1.33544921875, -1.2894287109375, -1.243408203125, -1.1973876953125, -1.1513671875, -1.1053466796875, -1.059326171875, -1.0133056640625, -0.96728515625, -0.9212646484375, -0.875244140625, -0.8292236328125, -0.783203125, -0.7371826171875, -0.691162109375, -0.6451416015625, -0.59912109375, -0.5531005859375, -0.507080078125, -0.4610595703125, -0.4150390625, -0.3690185546875, -0.322998046875, -0.2769775390625, -0.23095703125, -0.1849365234375, -0.138916015625, -0.0928955078125, -0.046875, -0.0008544921875, 0.045166015625, 0.0911865234375, 0.13720703125, 0.1832275390625, 0.229248046875, 0.2752685546875, 0.3212890625, 0.3673095703125, 0.413330078125, 0.4593505859375, 0.50537109375, 0.5513916015625, 0.597412109375, 0.6434326171875, 0.689453125, 0.7354736328125, 0.781494140625, 0.8275146484375, 0.87353515625, 0.9195556640625, 0.965576171875, 1.0115966796875, 1.0576171875, 1.1036376953125, 1.149658203125, 1.1956787109375, 1.24169921875, 1.2877197265625, 1.333740234375, 1.3797607421875, 1.42578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 9.0, 7.0, 7.0, 9.0, 7.0, 14.0, 13.0, 14.0, 16.0, 27.0, 29.0, 30.0, 40.0, 51.0, 53.0, 44.0, 62.0, 49.0, 58.0, 51.0, 59.0, 56.0, 41.0, 44.0, 34.0, 44.0, 27.0, 31.0, 16.0, 17.0, 9.0, 11.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015497207641601562, -0.00014794990420341492, -0.0001409277319908142, -0.0001339055597782135, -0.0001268833875656128, -0.00011986121535301208, -0.00011283904314041138, -0.00010581687092781067, -9.879469871520996e-05, -9.177252650260925e-05, -8.475035429000854e-05, -7.772818207740784e-05, -7.070600986480713e-05, -6.368383765220642e-05, -5.666166543960571e-05, -4.9639493227005005e-05, -4.26173210144043e-05, -3.559514880180359e-05, -2.857297658920288e-05, -2.1550804376602173e-05, -1.4528632164001465e-05, -7.506459951400757e-06, -4.842877388000488e-07, 6.537884473800659e-06, 1.3560056686401367e-05, 2.0582228899002075e-05, 2.7604401111602783e-05, 3.462657332420349e-05, 4.16487455368042e-05, 4.867091774940491e-05, 5.5693089962005615e-05, 6.271526217460632e-05, 6.973743438720703e-05, 7.675960659980774e-05, 8.378177881240845e-05, 9.080395102500916e-05, 9.782612323760986e-05, 0.00010484829545021057, 0.00011187046766281128, 0.00011889263987541199, 0.0001259148120880127, 0.0001329369843006134, 0.0001399591565132141, 0.00014698132872581482, 0.00015400350093841553, 0.00016102567315101624, 0.00016804784536361694, 0.00017507001757621765, 0.00018209218978881836, 0.00018911436200141907, 0.00019613653421401978, 0.00020315870642662048, 0.0002101808786392212, 0.0002172030508518219, 0.0002242252230644226, 0.00023124739527702332, 0.00023826956748962402, 0.00024529173970222473, 0.00025231391191482544, 0.00025933608412742615, 0.00026635825634002686, 0.00027338042855262756, 0.00028040260076522827, 0.000287424772977829, 0.0002944469451904297]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 11.0, 21.0, 29.0, 39.0, 55.0, 93.0, 138.0, 223.0, 310.0, 489.0, 694.0, 1158.0, 1636.0, 2573.0, 3925.0, 5995.0, 9196.0, 13582.0, 20307.0, 29696.0, 41789.0, 57230.0, 73932.0, 90094.0, 102800.0, 107780.0, 104552.0, 94228.0, 78249.0, 61445.0, 45964.0, 32824.0, 22435.0, 15340.0, 10173.0, 6739.0, 4350.0, 2951.0, 1882.0, 1263.0, 809.0, 545.0, 348.0, 216.0, 146.0, 90.0, 64.0, 44.0, 34.0, 21.0, 23.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0], "bins": [-1.40625, -1.3631591796875, -1.320068359375, -1.2769775390625, -1.23388671875, -1.1907958984375, -1.147705078125, -1.1046142578125, -1.0615234375, -1.0184326171875, -0.975341796875, -0.9322509765625, -0.88916015625, -0.8460693359375, -0.802978515625, -0.7598876953125, -0.716796875, -0.6737060546875, -0.630615234375, -0.5875244140625, -0.54443359375, -0.5013427734375, -0.458251953125, -0.4151611328125, -0.3720703125, -0.3289794921875, -0.285888671875, -0.2427978515625, -0.19970703125, -0.1566162109375, -0.113525390625, -0.0704345703125, -0.02734375, 0.0157470703125, 0.058837890625, 0.1019287109375, 0.14501953125, 0.1881103515625, 0.231201171875, 0.2742919921875, 0.3173828125, 0.3604736328125, 0.403564453125, 0.4466552734375, 0.48974609375, 0.5328369140625, 0.575927734375, 0.6190185546875, 0.662109375, 0.7052001953125, 0.748291015625, 0.7913818359375, 0.83447265625, 0.8775634765625, 0.920654296875, 0.9637451171875, 1.0068359375, 1.0499267578125, 1.093017578125, 1.1361083984375, 1.17919921875, 1.2222900390625, 1.265380859375, 1.3084716796875, 1.3515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 8.0, 9.0, 20.0, 21.0, 30.0, 34.0, 41.0, 36.0, 48.0, 58.0, 57.0, 65.0, 52.0, 46.0, 51.0, 62.0, 37.0, 60.0, 40.0, 35.0, 24.0, 32.0, 25.0, 17.0, 18.0, 12.0, 11.0, 10.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.7133712768554688, -0.6879730224609375, -0.6625747680664062, -0.637176513671875, -0.6117782592773438, -0.5863800048828125, -0.5609817504882812, -0.53558349609375, -0.5101852416992188, -0.4847869873046875, -0.45938873291015625, -0.433990478515625, -0.40859222412109375, -0.3831939697265625, -0.35779571533203125, -0.3323974609375, -0.30699920654296875, -0.2816009521484375, -0.25620269775390625, -0.230804443359375, -0.20540618896484375, -0.1800079345703125, -0.15460968017578125, -0.12921142578125, -0.10381317138671875, -0.0784149169921875, -0.05301666259765625, -0.027618408203125, -0.00222015380859375, 0.0231781005859375, 0.04857635498046875, 0.073974609375, 0.09937286376953125, 0.1247711181640625, 0.15016937255859375, 0.175567626953125, 0.20096588134765625, 0.2263641357421875, 0.25176239013671875, 0.27716064453125, 0.30255889892578125, 0.3279571533203125, 0.35335540771484375, 0.378753662109375, 0.40415191650390625, 0.4295501708984375, 0.45494842529296875, 0.4803466796875, 0.5057449340820312, 0.5311431884765625, 0.5565414428710938, 0.581939697265625, 0.6073379516601562, 0.6327362060546875, 0.6581344604492188, 0.68353271484375, 0.7089309692382812, 0.7343292236328125, 0.7597274780273438, 0.785125732421875, 0.8105239868164062, 0.8359222412109375, 0.8613204956054688, 0.88671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 13.0, 8.0, 16.0, 15.0, 13.0, 12.0, 12.0, 23.0, 22.0, 28.0, 25.0, 32.0, 25.0, 30.0, 42.0, 36.0, 48.0, 35.0, 38.0, 39.0, 40.0, 42.0, 40.0, 40.0, 35.0, 32.0, 39.0, 36.0, 22.0, 11.0, 20.0, 21.0, 22.0, 12.0, 11.0, 9.0, 5.0, 3.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0], "bins": [-5.293663501739502, -5.1222357749938965, -4.950808048248291, -4.7793803215026855, -4.60795259475708, -4.436524868011475, -4.265097618103027, -4.093669891357422, -3.9222419261932373, -3.750814199447632, -3.5793864727020264, -3.407958984375, -3.2365312576293945, -3.065103530883789, -2.8936758041381836, -2.722248077392578, -2.5508203506469727, -2.379392623901367, -2.2079648971557617, -2.0365371704101562, -1.8651095628738403, -1.6936818361282349, -1.522254228591919, -1.3508265018463135, -1.179398775100708, -1.0079710483551025, -0.8365433812141418, -0.6651157140731812, -0.4936879873275757, -0.3222602605819702, -0.1508326530456543, 0.020595073699951172, 0.19202327728271484, 0.3634509742259979, 0.534878671169281, 0.7063063383102417, 0.8777340650558472, 1.0491617918014526, 1.2205893993377686, 1.392017126083374, 1.5634448528289795, 1.734872579574585, 1.9063003063201904, 2.077727794647217, 2.2491555213928223, 2.4205832481384277, 2.592010974884033, 2.7634387016296387, 2.934866428375244, 3.1062941551208496, 3.277721881866455, 3.4491496086120605, 3.620577335357666, 3.7920050621032715, 3.963432550430298, 4.134860038757324, 4.30628776550293, 4.477715492248535, 4.649143218994141, 4.820570945739746, 4.991998672485352, 5.163426399230957, 5.3348541259765625, 5.506281852722168, 5.677709579467773]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 2.0, 7.0, 9.0, 12.0, 11.0, 19.0, 16.0, 21.0, 19.0, 26.0, 30.0, 33.0, 31.0, 35.0, 39.0, 45.0, 40.0, 46.0, 37.0, 48.0, 40.0, 51.0, 39.0, 40.0, 40.0, 32.0, 32.0, 34.0, 22.0, 21.0, 16.0, 15.0, 16.0, 10.0, 12.0, 10.0, 5.0, 6.0, 6.0, 6.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.248567581176758, -6.045586585998535, -5.8426055908203125, -5.639625072479248, -5.436644077301025, -5.233663082122803, -5.03068208694458, -4.827701568603516, -4.624720573425293, -4.42173957824707, -4.218758583068848, -4.015778064727783, -3.8127970695495605, -3.609816074371338, -3.4068350791931152, -3.2038543224334717, -3.000873327255249, -2.7978923320770264, -2.594911575317383, -2.39193058013916, -2.1889498233795166, -1.985968828201294, -1.7829879522323608, -1.5800070762634277, -1.3770262002944946, -1.1740453243255615, -0.9710644483566284, -0.7680835127830505, -0.5651026368141174, -0.36212170124053955, -0.15914082527160645, 0.04384005069732666, 0.24682092666625977, 0.44980180263519287, 0.652782678604126, 0.8557636141777039, 1.0587444305419922, 1.2617254257202148, 1.464706301689148, 1.667687177658081, 1.8706680536270142, 2.0736489295959473, 2.27662992477417, 2.4796106815338135, 2.682591676712036, 2.8855724334716797, 3.0885534286499023, 3.291534423828125, 3.4945151805877686, 3.697496175765991, 3.9004769325256348, 4.103457927703857, 4.30643892288208, 4.5094194412231445, 4.712400436401367, 4.91538143157959, 5.1183624267578125, 5.321343421936035, 5.524324417114258, 5.727304935455322, 5.930285930633545, 6.133266925811768, 6.33624792098999, 6.539228439331055, 6.742209434509277]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 13.0, 21.0, 58.0, 60.0, 107.0, 184.0, 294.0, 510.0, 890.0, 1562.0, 2565.0, 4545.0, 7981.0, 13707.0, 24113.0, 41427.0, 72297.0, 124912.0, 209447.0, 337228.0, 498718.0, 638331.0, 662082.0, 555200.0, 391295.0, 249134.0, 150500.0, 88229.0, 50996.0, 29184.0, 16510.0, 9233.0, 5449.0, 3244.0, 1722.0, 1040.0, 602.0, 363.0, 214.0, 113.0, 78.0, 47.0, 25.0, 22.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.578125, -5.39923095703125, -5.2203369140625, -5.04144287109375, -4.862548828125, -4.68365478515625, -4.5047607421875, -4.32586669921875, -4.14697265625, -3.96807861328125, -3.7891845703125, -3.61029052734375, -3.431396484375, -3.25250244140625, -3.0736083984375, -2.89471435546875, -2.7158203125, -2.53692626953125, -2.3580322265625, -2.17913818359375, -2.000244140625, -1.82135009765625, -1.6424560546875, -1.46356201171875, -1.28466796875, -1.10577392578125, -0.9268798828125, -0.74798583984375, -0.569091796875, -0.39019775390625, -0.2113037109375, -0.03240966796875, 0.146484375, 0.32537841796875, 0.5042724609375, 0.68316650390625, 0.862060546875, 1.04095458984375, 1.2198486328125, 1.39874267578125, 1.57763671875, 1.75653076171875, 1.9354248046875, 2.11431884765625, 2.293212890625, 2.47210693359375, 2.6510009765625, 2.82989501953125, 3.0087890625, 3.18768310546875, 3.3665771484375, 3.54547119140625, 3.724365234375, 3.90325927734375, 4.0821533203125, 4.26104736328125, 4.43994140625, 4.61883544921875, 4.7977294921875, 4.97662353515625, 5.155517578125, 5.33441162109375, 5.5133056640625, 5.69219970703125, 5.87109375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 2.0, 10.0, 6.0, 10.0, 22.0, 8.0, 9.0, 21.0, 19.0, 19.0, 22.0, 34.0, 25.0, 26.0, 34.0, 34.0, 31.0, 33.0, 39.0, 40.0, 47.0, 37.0, 33.0, 32.0, 38.0, 43.0, 40.0, 28.0, 31.0, 36.0, 22.0, 17.0, 17.0, 15.0, 17.0, 16.0, 11.0, 19.0, 6.0, 8.0, 4.0, 9.0, 2.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.93359375, -4.7791748046875, -4.624755859375, -4.4703369140625, -4.31591796875, -4.1614990234375, -4.007080078125, -3.8526611328125, -3.6982421875, -3.5438232421875, -3.389404296875, -3.2349853515625, -3.08056640625, -2.9261474609375, -2.771728515625, -2.6173095703125, -2.462890625, -2.3084716796875, -2.154052734375, -1.9996337890625, -1.84521484375, -1.6907958984375, -1.536376953125, -1.3819580078125, -1.2275390625, -1.0731201171875, -0.918701171875, -0.7642822265625, -0.60986328125, -0.4554443359375, -0.301025390625, -0.1466064453125, 0.0078125, 0.1622314453125, 0.316650390625, 0.4710693359375, 0.62548828125, 0.7799072265625, 0.934326171875, 1.0887451171875, 1.2431640625, 1.3975830078125, 1.552001953125, 1.7064208984375, 1.86083984375, 2.0152587890625, 2.169677734375, 2.3240966796875, 2.478515625, 2.6329345703125, 2.787353515625, 2.9417724609375, 3.09619140625, 3.2506103515625, 3.405029296875, 3.5594482421875, 3.7138671875, 3.8682861328125, 4.022705078125, 4.1771240234375, 4.33154296875, 4.4859619140625, 4.640380859375, 4.7947998046875, 4.94921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 11.0, 13.0, 23.0, 30.0, 56.0, 78.0, 154.0, 221.0, 321.0, 561.0, 930.0, 1439.0, 2357.0, 3838.0, 6311.0, 10189.0, 16693.0, 27410.0, 44358.0, 70441.0, 110538.0, 170807.0, 254268.0, 360869.0, 475301.0, 552058.0, 551433.0, 469592.0, 356719.0, 250134.0, 167418.0, 109190.0, 68658.0, 43073.0, 26510.0, 16425.0, 9953.0, 6114.0, 3714.0, 2303.0, 1427.0, 872.0, 573.0, 343.0, 183.0, 166.0, 93.0, 48.0, 26.0, 10.0, 18.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-5.14453125, -4.988525390625, -4.83251953125, -4.676513671875, -4.5205078125, -4.364501953125, -4.20849609375, -4.052490234375, -3.896484375, -3.740478515625, -3.58447265625, -3.428466796875, -3.2724609375, -3.116455078125, -2.96044921875, -2.804443359375, -2.6484375, -2.492431640625, -2.33642578125, -2.180419921875, -2.0244140625, -1.868408203125, -1.71240234375, -1.556396484375, -1.400390625, -1.244384765625, -1.08837890625, -0.932373046875, -0.7763671875, -0.620361328125, -0.46435546875, -0.308349609375, -0.15234375, 0.003662109375, 0.15966796875, 0.315673828125, 0.4716796875, 0.627685546875, 0.78369140625, 0.939697265625, 1.095703125, 1.251708984375, 1.40771484375, 1.563720703125, 1.7197265625, 1.875732421875, 2.03173828125, 2.187744140625, 2.34375, 2.499755859375, 2.65576171875, 2.811767578125, 2.9677734375, 3.123779296875, 3.27978515625, 3.435791015625, 3.591796875, 3.747802734375, 3.90380859375, 4.059814453125, 4.2158203125, 4.371826171875, 4.52783203125, 4.683837890625, 4.83984375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 13.0, 8.0, 14.0, 7.0, 22.0, 16.0, 27.0, 31.0, 55.0, 40.0, 74.0, 66.0, 90.0, 118.0, 102.0, 174.0, 183.0, 176.0, 232.0, 216.0, 215.0, 255.0, 233.0, 246.0, 222.0, 214.0, 172.0, 138.0, 134.0, 112.0, 105.0, 70.0, 52.0, 37.0, 37.0, 33.0, 24.0, 24.0, 22.0, 17.0, 9.0, 10.0, 8.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.062713623046875, -1.99066162109375, -1.918609619140625, -1.8465576171875, -1.774505615234375, -1.70245361328125, -1.630401611328125, -1.558349609375, -1.486297607421875, -1.41424560546875, -1.342193603515625, -1.2701416015625, -1.198089599609375, -1.12603759765625, -1.053985595703125, -0.98193359375, -0.909881591796875, -0.83782958984375, -0.765777587890625, -0.6937255859375, -0.621673583984375, -0.54962158203125, -0.477569580078125, -0.405517578125, -0.333465576171875, -0.26141357421875, -0.189361572265625, -0.1173095703125, -0.045257568359375, 0.02679443359375, 0.098846435546875, 0.1708984375, 0.242950439453125, 0.31500244140625, 0.387054443359375, 0.4591064453125, 0.531158447265625, 0.60321044921875, 0.675262451171875, 0.747314453125, 0.819366455078125, 0.89141845703125, 0.963470458984375, 1.0355224609375, 1.107574462890625, 1.17962646484375, 1.251678466796875, 1.32373046875, 1.395782470703125, 1.46783447265625, 1.539886474609375, 1.6119384765625, 1.683990478515625, 1.75604248046875, 1.828094482421875, 1.900146484375, 1.972198486328125, 2.04425048828125, 2.116302490234375, 2.1883544921875, 2.260406494140625, 2.33245849609375, 2.404510498046875, 2.4765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 1.0, 8.0, 3.0, 9.0, 9.0, 17.0, 11.0, 19.0, 15.0, 18.0, 26.0, 26.0, 29.0, 34.0, 31.0, 41.0, 30.0, 38.0, 44.0, 44.0, 48.0, 45.0, 37.0, 38.0, 39.0, 45.0, 40.0, 28.0, 42.0, 20.0, 30.0, 13.0, 21.0, 20.0, 18.0, 8.0, 10.0, 10.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.892075538635254, -5.709245681762695, -5.526415824890137, -5.343585968017578, -5.1607561111450195, -4.977925777435303, -4.795095920562744, -4.6122660636901855, -4.429436206817627, -4.246606349945068, -4.06377649307251, -3.880946397781372, -3.6981165409088135, -3.515286684036255, -3.332456588745117, -3.1496267318725586, -2.966796875, -2.7839670181274414, -2.601137161254883, -2.418307065963745, -2.2354772090911865, -2.052647352218628, -1.8698173761367798, -1.6869874000549316, -1.504157543182373, -1.3213276863098145, -1.1384977102279663, -0.9556677937507629, -0.7728378772735596, -0.5900079607963562, -0.40717804431915283, -0.2243480682373047, -0.041518211364746094, 0.14131170511245728, 0.32414162158966064, 0.506971538066864, 0.6898014545440674, 0.8726313710212708, 1.0554612874984741, 1.2382912635803223, 1.4211211204528809, 1.6039509773254395, 1.7867809534072876, 1.9696109294891357, 2.1524407863616943, 2.335270643234253, 2.5181007385253906, 2.700930595397949, 2.883760452270508, 3.0665903091430664, 3.249420166015625, 3.4322502613067627, 3.6150801181793213, 3.79790997505188, 3.9807400703430176, 4.163569927215576, 4.346399784088135, 4.529229640960693, 4.712059497833252, 4.8948893547058105, 5.077719688415527, 5.260549545288086, 5.4433794021606445, 5.626209259033203, 5.809039115905762]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 7.0, 4.0, 8.0, 13.0, 21.0, 6.0, 12.0, 17.0, 23.0, 26.0, 24.0, 29.0, 32.0, 32.0, 25.0, 45.0, 37.0, 50.0, 34.0, 43.0, 37.0, 46.0, 34.0, 52.0, 37.0, 35.0, 30.0, 33.0, 36.0, 24.0, 11.0, 14.0, 15.0, 17.0, 21.0, 13.0, 9.0, 11.0, 7.0, 5.0, 5.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.465060710906982, -5.276137828826904, -5.087214946746826, -4.898292064666748, -4.709369659423828, -4.52044677734375, -4.331523895263672, -4.142601013183594, -3.9536781311035156, -3.7647552490234375, -3.5758323669433594, -3.3869097232818604, -3.1979868412017822, -3.009063959121704, -2.820141315460205, -2.631218433380127, -2.442295551300049, -2.2533726692199707, -2.0644497871398926, -1.8755271434783936, -1.6866042613983154, -1.4976813793182373, -1.3087586164474487, -1.1198358535766602, -0.930912971496582, -0.7419901490211487, -0.5530673265457153, -0.364144504070282, -0.17522168159484863, 0.013701140880584717, 0.20262396335601807, 0.39154672622680664, 0.5804696083068848, 0.7693924307823181, 0.9583152532577515, 1.14723801612854, 1.3361608982086182, 1.5250837802886963, 1.7140065431594849, 1.9029293060302734, 2.0918521881103516, 2.2807750701904297, 2.469697952270508, 2.658620595932007, 2.847543478012085, 3.036466360092163, 3.225389003753662, 3.4143118858337402, 3.6032347679138184, 3.7921576499938965, 3.9810805320739746, 4.170003414154053, 4.358925819396973, 4.547848701477051, 4.736771583557129, 4.925694465637207, 5.114617347717285, 5.303540229797363, 5.492463111877441, 5.6813859939575195, 5.870308876037598, 6.059231281280518, 6.248154163360596, 6.437077045440674, 6.625999927520752]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 12.0, 8.0, 16.0, 33.0, 64.0, 82.0, 118.0, 215.0, 318.0, 469.0, 775.0, 1166.0, 1918.0, 2961.0, 4683.0, 7109.0, 10778.0, 16164.0, 23642.0, 33464.0, 45511.0, 59745.0, 74838.0, 89061.0, 98448.0, 102546.0, 98487.0, 88757.0, 75310.0, 60388.0, 46138.0, 33692.0, 24061.0, 16388.0, 11000.0, 7100.0, 4690.0, 3059.0, 1941.0, 1254.0, 776.0, 479.0, 315.0, 212.0, 134.0, 81.0, 60.0, 38.0, 25.0, 16.0, 12.0, 3.0, 5.0, 1.0, 1.0], "bins": [-2.572265625, -2.49774169921875, -2.4232177734375, -2.34869384765625, -2.274169921875, -2.19964599609375, -2.1251220703125, -2.05059814453125, -1.97607421875, -1.90155029296875, -1.8270263671875, -1.75250244140625, -1.677978515625, -1.60345458984375, -1.5289306640625, -1.45440673828125, -1.3798828125, -1.30535888671875, -1.2308349609375, -1.15631103515625, -1.081787109375, -1.00726318359375, -0.9327392578125, -0.85821533203125, -0.78369140625, -0.70916748046875, -0.6346435546875, -0.56011962890625, -0.485595703125, -0.41107177734375, -0.3365478515625, -0.26202392578125, -0.1875, -0.11297607421875, -0.0384521484375, 0.03607177734375, 0.110595703125, 0.18511962890625, 0.2596435546875, 0.33416748046875, 0.40869140625, 0.48321533203125, 0.5577392578125, 0.63226318359375, 0.706787109375, 0.78131103515625, 0.8558349609375, 0.93035888671875, 1.0048828125, 1.07940673828125, 1.1539306640625, 1.22845458984375, 1.302978515625, 1.37750244140625, 1.4520263671875, 1.52655029296875, 1.60107421875, 1.67559814453125, 1.7501220703125, 1.82464599609375, 1.899169921875, 1.97369384765625, 2.0482177734375, 2.12274169921875, 2.197265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 7.0, 15.0, 20.0, 11.0, 10.0, 19.0, 15.0, 20.0, 28.0, 34.0, 25.0, 29.0, 35.0, 35.0, 40.0, 57.0, 46.0, 45.0, 44.0, 34.0, 40.0, 36.0, 45.0, 37.0, 27.0, 36.0, 26.0, 29.0, 16.0, 21.0, 15.0, 17.0, 16.0, 11.0, 6.0, 4.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.13671875, -4.95916748046875, -4.7816162109375, -4.60406494140625, -4.426513671875, -4.24896240234375, -4.0714111328125, -3.89385986328125, -3.71630859375, -3.53875732421875, -3.3612060546875, -3.18365478515625, -3.006103515625, -2.82855224609375, -2.6510009765625, -2.47344970703125, -2.2958984375, -2.11834716796875, -1.9407958984375, -1.76324462890625, -1.585693359375, -1.40814208984375, -1.2305908203125, -1.05303955078125, -0.87548828125, -0.69793701171875, -0.5203857421875, -0.34283447265625, -0.165283203125, 0.01226806640625, 0.1898193359375, 0.36737060546875, 0.544921875, 0.72247314453125, 0.9000244140625, 1.07757568359375, 1.255126953125, 1.43267822265625, 1.6102294921875, 1.78778076171875, 1.96533203125, 2.14288330078125, 2.3204345703125, 2.49798583984375, 2.675537109375, 2.85308837890625, 3.0306396484375, 3.20819091796875, 3.3857421875, 3.56329345703125, 3.7408447265625, 3.91839599609375, 4.095947265625, 4.27349853515625, 4.4510498046875, 4.62860107421875, 4.80615234375, 4.98370361328125, 5.1612548828125, 5.33880615234375, 5.516357421875, 5.69390869140625, 5.8714599609375, 6.04901123046875, 6.2265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 16.0, 18.0, 20.0, 25.0, 37.0, 75.0, 102.0, 153.0, 225.0, 380.0, 747.0, 1171.0, 2122.0, 3720.0, 6779.0, 12709.0, 26496.0, 142256.0, 764704.0, 46435.0, 18932.0, 9547.0, 5112.0, 2822.0, 1547.0, 897.0, 512.0, 326.0, 222.0, 144.0, 76.0, 53.0, 48.0, 24.0, 10.0, 27.0, 15.0, 10.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.4921875, -10.15673828125, -9.8212890625, -9.48583984375, -9.150390625, -8.81494140625, -8.4794921875, -8.14404296875, -7.80859375, -7.47314453125, -7.1376953125, -6.80224609375, -6.466796875, -6.13134765625, -5.7958984375, -5.46044921875, -5.125, -4.78955078125, -4.4541015625, -4.11865234375, -3.783203125, -3.44775390625, -3.1123046875, -2.77685546875, -2.44140625, -2.10595703125, -1.7705078125, -1.43505859375, -1.099609375, -0.76416015625, -0.4287109375, -0.09326171875, 0.2421875, 0.57763671875, 0.9130859375, 1.24853515625, 1.583984375, 1.91943359375, 2.2548828125, 2.59033203125, 2.92578125, 3.26123046875, 3.5966796875, 3.93212890625, 4.267578125, 4.60302734375, 4.9384765625, 5.27392578125, 5.609375, 5.94482421875, 6.2802734375, 6.61572265625, 6.951171875, 7.28662109375, 7.6220703125, 7.95751953125, 8.29296875, 8.62841796875, 8.9638671875, 9.29931640625, 9.634765625, 9.97021484375, 10.3056640625, 10.64111328125, 10.9765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 7.0, 5.0, 8.0, 6.0, 13.0, 6.0, 16.0, 16.0, 20.0, 23.0, 27.0, 31.0, 33.0, 24.0, 36.0, 41.0, 47.0, 44.0, 50.0, 50.0, 42.0, 45.0, 54.0, 41.0, 38.0, 25.0, 40.0, 32.0, 29.0, 27.0, 23.0, 24.0, 21.0, 16.0, 13.0, 10.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9140625, -6.6832275390625, -6.452392578125, -6.2215576171875, -5.99072265625, -5.7598876953125, -5.529052734375, -5.2982177734375, -5.0673828125, -4.8365478515625, -4.605712890625, -4.3748779296875, -4.14404296875, -3.9132080078125, -3.682373046875, -3.4515380859375, -3.220703125, -2.9898681640625, -2.759033203125, -2.5281982421875, -2.29736328125, -2.0665283203125, -1.835693359375, -1.6048583984375, -1.3740234375, -1.1431884765625, -0.912353515625, -0.6815185546875, -0.45068359375, -0.2198486328125, 0.010986328125, 0.2418212890625, 0.47265625, 0.7034912109375, 0.934326171875, 1.1651611328125, 1.39599609375, 1.6268310546875, 1.857666015625, 2.0885009765625, 2.3193359375, 2.5501708984375, 2.781005859375, 3.0118408203125, 3.24267578125, 3.4735107421875, 3.704345703125, 3.9351806640625, 4.166015625, 4.3968505859375, 4.627685546875, 4.8585205078125, 5.08935546875, 5.3201904296875, 5.551025390625, 5.7818603515625, 6.0126953125, 6.2435302734375, 6.474365234375, 6.7052001953125, 6.93603515625, 7.1668701171875, 7.397705078125, 7.6285400390625, 7.859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 9.0, 11.0, 14.0, 24.0, 32.0, 41.0, 49.0, 47.0, 93.0, 112.0, 184.0, 272.0, 327.0, 549.0, 774.0, 1207.0, 1912.0, 3230.0, 5752.0, 11101.0, 24839.0, 108075.0, 760713.0, 82637.0, 22328.0, 10300.0, 5288.0, 3123.0, 1813.0, 1178.0, 761.0, 496.0, 386.0, 257.0, 180.0, 128.0, 82.0, 63.0, 51.0, 25.0, 22.0, 15.0, 13.0, 17.0, 7.0, 6.0, 4.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.421875, -2.342315673828125, -2.26275634765625, -2.183197021484375, -2.1036376953125, -2.024078369140625, -1.94451904296875, -1.864959716796875, -1.785400390625, -1.705841064453125, -1.62628173828125, -1.546722412109375, -1.4671630859375, -1.387603759765625, -1.30804443359375, -1.228485107421875, -1.14892578125, -1.069366455078125, -0.98980712890625, -0.910247802734375, -0.8306884765625, -0.751129150390625, -0.67156982421875, -0.592010498046875, -0.512451171875, -0.432891845703125, -0.35333251953125, -0.273773193359375, -0.1942138671875, -0.114654541015625, -0.03509521484375, 0.044464111328125, 0.1240234375, 0.203582763671875, 0.28314208984375, 0.362701416015625, 0.4422607421875, 0.521820068359375, 0.60137939453125, 0.680938720703125, 0.760498046875, 0.840057373046875, 0.91961669921875, 0.999176025390625, 1.0787353515625, 1.158294677734375, 1.23785400390625, 1.317413330078125, 1.39697265625, 1.476531982421875, 1.55609130859375, 1.635650634765625, 1.7152099609375, 1.794769287109375, 1.87432861328125, 1.953887939453125, 2.033447265625, 2.113006591796875, 2.19256591796875, 2.272125244140625, 2.3516845703125, 2.431243896484375, 2.51080322265625, 2.590362548828125, 2.669921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 10.0, 13.0, 20.0, 27.0, 35.0, 40.0, 58.0, 66.0, 86.0, 120.0, 121.0, 81.0, 52.0, 45.0, 41.0, 39.0, 23.0, 21.0, 17.0, 12.0, 14.0, 8.0, 4.0, 8.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008840560913085938, -0.0008595213294029236, -0.0008349865674972534, -0.0008104518055915833, -0.0007859170436859131, -0.0007613822817802429, -0.0007368475198745728, -0.0007123127579689026, -0.0006877779960632324, -0.0006632432341575623, -0.0006387084722518921, -0.0006141737103462219, -0.0005896389484405518, -0.0005651041865348816, -0.0005405694246292114, -0.0005160346627235413, -0.0004914999008178711, -0.00046696513891220093, -0.00044243037700653076, -0.0004178956151008606, -0.00039336085319519043, -0.00036882609128952026, -0.0003442913293838501, -0.00031975656747817993, -0.00029522180557250977, -0.0002706870436668396, -0.00024615228176116943, -0.00022161751985549927, -0.0001970827579498291, -0.00017254799604415894, -0.00014801323413848877, -0.0001234784722328186, -9.894371032714844e-05, -7.440894842147827e-05, -4.9874186515808105e-05, -2.533942461013794e-05, -8.046627044677734e-07, 2.3730099201202393e-05, 4.826486110687256e-05, 7.279962301254272e-05, 9.733438491821289e-05, 0.00012186914682388306, 0.00014640390872955322, 0.0001709386706352234, 0.00019547343254089355, 0.00022000819444656372, 0.0002445429563522339, 0.00026907771825790405, 0.0002936124801635742, 0.0003181472420692444, 0.00034268200397491455, 0.0003672167658805847, 0.0003917515277862549, 0.00041628628969192505, 0.0004408210515975952, 0.0004653558135032654, 0.0004898905754089355, 0.0005144253373146057, 0.0005389600992202759, 0.000563494861125946, 0.0005880296230316162, 0.0006125643849372864, 0.0006370991468429565, 0.0006616339087486267, 0.0006861686706542969]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 12.0, 19.0, 13.0, 30.0, 49.0, 48.0, 93.0, 110.0, 200.0, 288.0, 442.0, 671.0, 1013.0, 1619.0, 2591.0, 4165.0, 6543.0, 11208.0, 18839.0, 33867.0, 62988.0, 118655.0, 200235.0, 229012.0, 159373.0, 87107.0, 46188.0, 25519.0, 14623.0, 8628.0, 5253.0, 3325.0, 2065.0, 1288.0, 822.0, 536.0, 357.0, 250.0, 142.0, 106.0, 93.0, 57.0, 40.0, 21.0, 18.0, 7.0, 9.0, 5.0, 7.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.3515625, -1.309661865234375, -1.26776123046875, -1.225860595703125, -1.1839599609375, -1.142059326171875, -1.10015869140625, -1.058258056640625, -1.016357421875, -0.974456787109375, -0.93255615234375, -0.890655517578125, -0.8487548828125, -0.806854248046875, -0.76495361328125, -0.723052978515625, -0.68115234375, -0.639251708984375, -0.59735107421875, -0.555450439453125, -0.5135498046875, -0.471649169921875, -0.42974853515625, -0.387847900390625, -0.345947265625, -0.304046630859375, -0.26214599609375, -0.220245361328125, -0.1783447265625, -0.136444091796875, -0.09454345703125, -0.052642822265625, -0.0107421875, 0.031158447265625, 0.07305908203125, 0.114959716796875, 0.1568603515625, 0.198760986328125, 0.24066162109375, 0.282562255859375, 0.324462890625, 0.366363525390625, 0.40826416015625, 0.450164794921875, 0.4920654296875, 0.533966064453125, 0.57586669921875, 0.617767333984375, 0.65966796875, 0.701568603515625, 0.74346923828125, 0.785369873046875, 0.8272705078125, 0.869171142578125, 0.91107177734375, 0.952972412109375, 0.994873046875, 1.036773681640625, 1.07867431640625, 1.120574951171875, 1.1624755859375, 1.204376220703125, 1.24627685546875, 1.288177490234375, 1.330078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 12.0, 19.0, 16.0, 27.0, 30.0, 40.0, 42.0, 54.0, 57.0, 76.0, 71.0, 68.0, 67.0, 65.0, 70.0, 53.0, 57.0, 45.0, 33.0, 25.0, 15.0, 12.0, 10.0, 8.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5462760925292969, -0.5305404663085938, -0.5148048400878906, -0.4990692138671875, -0.4833335876464844, -0.46759796142578125, -0.4518623352050781, -0.436126708984375, -0.4203910827636719, -0.40465545654296875, -0.3889198303222656, -0.3731842041015625, -0.3574485778808594, -0.34171295166015625, -0.3259773254394531, -0.31024169921875, -0.2945060729980469, -0.27877044677734375, -0.2630348205566406, -0.2472991943359375, -0.23156356811523438, -0.21582794189453125, -0.20009231567382812, -0.184356689453125, -0.16862106323242188, -0.15288543701171875, -0.13714981079101562, -0.1214141845703125, -0.10567855834960938, -0.08994293212890625, -0.07420730590820312, -0.0584716796875, -0.042736053466796875, -0.02700042724609375, -0.011264801025390625, 0.0044708251953125, 0.020206451416015625, 0.03594207763671875, 0.051677703857421875, 0.067413330078125, 0.08314895629882812, 0.09888458251953125, 0.11462020874023438, 0.1303558349609375, 0.14609146118164062, 0.16182708740234375, 0.17756271362304688, 0.19329833984375, 0.20903396606445312, 0.22476959228515625, 0.24050521850585938, 0.2562408447265625, 0.2719764709472656, 0.28771209716796875, 0.3034477233886719, 0.319183349609375, 0.3349189758300781, 0.35065460205078125, 0.3663902282714844, 0.3821258544921875, 0.3978614807128906, 0.41359710693359375, 0.4293327331542969, 0.445068359375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 8.0, 7.0, 7.0, 22.0, 24.0, 15.0, 14.0, 20.0, 37.0, 36.0, 32.0, 39.0, 28.0, 36.0, 34.0, 47.0, 45.0, 35.0, 51.0, 50.0, 34.0, 41.0, 40.0, 40.0, 33.0, 27.0, 29.0, 21.0, 18.0, 27.0, 12.0, 7.0, 9.0, 13.0, 8.0, 6.0, 5.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.1258015632629395, -4.959199905395508, -4.792597770690918, -4.625996112823486, -4.4593939781188965, -4.292792320251465, -4.126190185546875, -3.9595885276794434, -3.7929866313934326, -3.626384735107422, -3.459782838821411, -3.2931809425354004, -3.1265792846679688, -2.959977149963379, -2.7933754920959473, -2.6267735958099365, -2.460171699523926, -2.293569803237915, -2.1269679069519043, -1.960366129875183, -1.7937642335891724, -1.6271623373031616, -1.4605605602264404, -1.2939586639404297, -1.127356767654419, -0.9607548713684082, -0.7941530346870422, -0.6275511980056763, -0.4609493017196655, -0.2943474054336548, -0.12774556875228882, 0.03885626792907715, 0.2054581642150879, 0.37206003069877625, 0.5386618971824646, 0.7052637338638306, 0.8718656301498413, 1.038467526435852, 1.2050693035125732, 1.371671199798584, 1.5382730960845947, 1.7048749923706055, 1.8714768886566162, 2.038078784942627, 2.2046804428100586, 2.3712825775146484, 2.53788423538208, 2.704486131668091, 2.8710880279541016, 3.0376899242401123, 3.204291820526123, 3.370893716812134, 3.5374956130981445, 3.704097270965576, 3.870699167251587, 4.037301063537598, 4.2039031982421875, 4.370504856109619, 4.537106990814209, 4.703708648681641, 4.8703107833862305, 5.036912441253662, 5.203514575958252, 5.370116233825684, 5.536717891693115]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 5.0, 5.0, 9.0, 10.0, 13.0, 9.0, 9.0, 11.0, 25.0, 20.0, 29.0, 29.0, 27.0, 29.0, 26.0, 29.0, 39.0, 31.0, 53.0, 36.0, 43.0, 44.0, 50.0, 42.0, 51.0, 38.0, 32.0, 32.0, 36.0, 20.0, 24.0, 19.0, 20.0, 18.0, 13.0, 9.0, 14.0, 13.0, 4.0, 10.0, 10.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-5.595176696777344, -5.419276237487793, -5.243375778198242, -5.067475318908691, -4.891574859619141, -4.71567440032959, -4.539773941040039, -4.363873481750488, -4.1879730224609375, -4.012072563171387, -3.836172103881836, -3.660271644592285, -3.4843711853027344, -3.3084707260131836, -3.132570266723633, -2.956669807434082, -2.780769109725952, -2.6048686504364014, -2.4289681911468506, -2.2530677318573, -2.077167272567749, -1.9012668132781982, -1.725366234779358, -1.5494657754898071, -1.3735653162002563, -1.1976648569107056, -1.0217643976211548, -0.8458638787269592, -0.6699634194374084, -0.49406296014785767, -0.3181624412536621, -0.14226198196411133, 0.03363847732543945, 0.20953895151615143, 0.3854394257068634, 0.5613399147987366, 0.7372403740882874, 0.9131408333778381, 1.0890413522720337, 1.2649418115615845, 1.4408422708511353, 1.616742730140686, 1.7926431894302368, 1.9685437679290771, 2.144444227218628, 2.3203446865081787, 2.4962451457977295, 2.6721456050872803, 2.848046064376831, 3.023946523666382, 3.1998469829559326, 3.3757474422454834, 3.551647901535034, 3.727548360824585, 3.903449058532715, 4.079349517822266, 4.255249977111816, 4.431150436401367, 4.607050895690918, 4.782951354980469, 4.9588518142700195, 5.13475227355957, 5.310652732849121, 5.486553192138672, 5.662453651428223]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 8.0, 11.0, 13.0, 16.0, 29.0, 46.0, 65.0, 95.0, 137.0, 223.0, 379.0, 600.0, 945.0, 1530.0, 2545.0, 4180.0, 6875.0, 11203.0, 17998.0, 28680.0, 44605.0, 66072.0, 92495.0, 116977.0, 132431.0, 131832.0, 115576.0, 90745.0, 65435.0, 43261.0, 27849.0, 17533.0, 10900.0, 6568.0, 4077.0, 2548.0, 1562.0, 952.0, 593.0, 341.0, 220.0, 123.0, 107.0, 56.0, 40.0, 39.0, 23.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.16015625, -5.003662109375, -4.84716796875, -4.690673828125, -4.5341796875, -4.377685546875, -4.22119140625, -4.064697265625, -3.908203125, -3.751708984375, -3.59521484375, -3.438720703125, -3.2822265625, -3.125732421875, -2.96923828125, -2.812744140625, -2.65625, -2.499755859375, -2.34326171875, -2.186767578125, -2.0302734375, -1.873779296875, -1.71728515625, -1.560791015625, -1.404296875, -1.247802734375, -1.09130859375, -0.934814453125, -0.7783203125, -0.621826171875, -0.46533203125, -0.308837890625, -0.15234375, 0.004150390625, 0.16064453125, 0.317138671875, 0.4736328125, 0.630126953125, 0.78662109375, 0.943115234375, 1.099609375, 1.256103515625, 1.41259765625, 1.569091796875, 1.7255859375, 1.882080078125, 2.03857421875, 2.195068359375, 2.3515625, 2.508056640625, 2.66455078125, 2.821044921875, 2.9775390625, 3.134033203125, 3.29052734375, 3.447021484375, 3.603515625, 3.760009765625, 3.91650390625, 4.072998046875, 4.2294921875, 4.385986328125, 4.54248046875, 4.698974609375, 4.85546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 9.0, 5.0, 6.0, 6.0, 14.0, 16.0, 19.0, 19.0, 17.0, 25.0, 22.0, 26.0, 37.0, 41.0, 36.0, 36.0, 47.0, 41.0, 41.0, 47.0, 33.0, 47.0, 45.0, 34.0, 43.0, 31.0, 48.0, 18.0, 24.0, 22.0, 23.0, 21.0, 15.0, 16.0, 10.0, 9.0, 10.0, 9.0, 11.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.79559326171875, -4.6224365234375, -4.44927978515625, -4.276123046875, -4.10296630859375, -3.9298095703125, -3.75665283203125, -3.58349609375, -3.41033935546875, -3.2371826171875, -3.06402587890625, -2.890869140625, -2.71771240234375, -2.5445556640625, -2.37139892578125, -2.1982421875, -2.02508544921875, -1.8519287109375, -1.67877197265625, -1.505615234375, -1.33245849609375, -1.1593017578125, -0.98614501953125, -0.81298828125, -0.63983154296875, -0.4666748046875, -0.29351806640625, -0.120361328125, 0.05279541015625, 0.2259521484375, 0.39910888671875, 0.572265625, 0.74542236328125, 0.9185791015625, 1.09173583984375, 1.264892578125, 1.43804931640625, 1.6112060546875, 1.78436279296875, 1.95751953125, 2.13067626953125, 2.3038330078125, 2.47698974609375, 2.650146484375, 2.82330322265625, 2.9964599609375, 3.16961669921875, 3.3427734375, 3.51593017578125, 3.6890869140625, 3.86224365234375, 4.035400390625, 4.20855712890625, 4.3817138671875, 4.55487060546875, 4.72802734375, 4.90118408203125, 5.0743408203125, 5.24749755859375, 5.420654296875, 5.59381103515625, 5.7669677734375, 5.94012451171875, 6.11328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 12.0, 19.0, 23.0, 34.0, 50.0, 104.0, 153.0, 282.0, 433.0, 802.0, 1260.0, 2063.0, 3382.0, 5818.0, 9493.0, 15578.0, 25743.0, 40473.0, 62118.0, 88896.0, 117142.0, 136394.0, 138820.0, 121866.0, 94672.0, 67272.0, 43992.0, 27617.0, 17458.0, 10543.0, 6307.0, 3843.0, 2354.0, 1448.0, 845.0, 491.0, 307.0, 198.0, 91.0, 61.0, 40.0, 19.0, 11.0, 12.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.33203125, -7.11700439453125, -6.9019775390625, -6.68695068359375, -6.471923828125, -6.25689697265625, -6.0418701171875, -5.82684326171875, -5.61181640625, -5.39678955078125, -5.1817626953125, -4.96673583984375, -4.751708984375, -4.53668212890625, -4.3216552734375, -4.10662841796875, -3.8916015625, -3.67657470703125, -3.4615478515625, -3.24652099609375, -3.031494140625, -2.81646728515625, -2.6014404296875, -2.38641357421875, -2.17138671875, -1.95635986328125, -1.7413330078125, -1.52630615234375, -1.311279296875, -1.09625244140625, -0.8812255859375, -0.66619873046875, -0.451171875, -0.23614501953125, -0.0211181640625, 0.19390869140625, 0.408935546875, 0.62396240234375, 0.8389892578125, 1.05401611328125, 1.26904296875, 1.48406982421875, 1.6990966796875, 1.91412353515625, 2.129150390625, 2.34417724609375, 2.5592041015625, 2.77423095703125, 2.9892578125, 3.20428466796875, 3.4193115234375, 3.63433837890625, 3.849365234375, 4.06439208984375, 4.2794189453125, 4.49444580078125, 4.70947265625, 4.92449951171875, 5.1395263671875, 5.35455322265625, 5.569580078125, 5.78460693359375, 5.9996337890625, 6.21466064453125, 6.4296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 9.0, 8.0, 8.0, 19.0, 10.0, 18.0, 21.0, 33.0, 34.0, 32.0, 29.0, 43.0, 31.0, 33.0, 31.0, 43.0, 41.0, 38.0, 44.0, 45.0, 40.0, 39.0, 48.0, 44.0, 28.0, 39.0, 27.0, 25.0, 20.0, 21.0, 13.0, 19.0, 19.0, 7.0, 8.0, 4.0, 9.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.6961669921875, -3.572021484375, -3.4478759765625, -3.32373046875, -3.1995849609375, -3.075439453125, -2.9512939453125, -2.8271484375, -2.7030029296875, -2.578857421875, -2.4547119140625, -2.33056640625, -2.2064208984375, -2.082275390625, -1.9581298828125, -1.833984375, -1.7098388671875, -1.585693359375, -1.4615478515625, -1.33740234375, -1.2132568359375, -1.089111328125, -0.9649658203125, -0.8408203125, -0.7166748046875, -0.592529296875, -0.4683837890625, -0.34423828125, -0.2200927734375, -0.095947265625, 0.0281982421875, 0.15234375, 0.2764892578125, 0.400634765625, 0.5247802734375, 0.64892578125, 0.7730712890625, 0.897216796875, 1.0213623046875, 1.1455078125, 1.2696533203125, 1.393798828125, 1.5179443359375, 1.64208984375, 1.7662353515625, 1.890380859375, 2.0145263671875, 2.138671875, 2.2628173828125, 2.386962890625, 2.5111083984375, 2.63525390625, 2.7593994140625, 2.883544921875, 3.0076904296875, 3.1318359375, 3.2559814453125, 3.380126953125, 3.5042724609375, 3.62841796875, 3.7525634765625, 3.876708984375, 4.0008544921875, 4.125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 12.0, 9.0, 24.0, 17.0, 32.0, 44.0, 72.0, 98.0, 134.0, 260.0, 330.0, 571.0, 951.0, 1674.0, 3124.0, 6257.0, 12862.0, 27467.0, 61680.0, 130233.0, 224468.0, 250409.0, 169216.0, 85032.0, 38719.0, 17119.0, 8358.0, 4049.0, 2111.0, 1237.0, 683.0, 443.0, 288.0, 184.0, 116.0, 65.0, 59.0, 45.0, 20.0, 20.0, 18.0, 9.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.927734375, -3.8094482421875, -3.691162109375, -3.5728759765625, -3.45458984375, -3.3363037109375, -3.218017578125, -3.0997314453125, -2.9814453125, -2.8631591796875, -2.744873046875, -2.6265869140625, -2.50830078125, -2.3900146484375, -2.271728515625, -2.1534423828125, -2.03515625, -1.9168701171875, -1.798583984375, -1.6802978515625, -1.56201171875, -1.4437255859375, -1.325439453125, -1.2071533203125, -1.0888671875, -0.9705810546875, -0.852294921875, -0.7340087890625, -0.61572265625, -0.4974365234375, -0.379150390625, -0.2608642578125, -0.142578125, -0.0242919921875, 0.093994140625, 0.2122802734375, 0.33056640625, 0.4488525390625, 0.567138671875, 0.6854248046875, 0.8037109375, 0.9219970703125, 1.040283203125, 1.1585693359375, 1.27685546875, 1.3951416015625, 1.513427734375, 1.6317138671875, 1.75, 1.8682861328125, 1.986572265625, 2.1048583984375, 2.22314453125, 2.3414306640625, 2.459716796875, 2.5780029296875, 2.6962890625, 2.8145751953125, 2.932861328125, 3.0511474609375, 3.16943359375, 3.2877197265625, 3.406005859375, 3.5242919921875, 3.642578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 2.0, 6.0, 9.0, 8.0, 20.0, 18.0, 27.0, 40.0, 38.0, 50.0, 73.0, 78.0, 78.0, 114.0, 85.0, 77.0, 60.0, 44.0, 51.0, 32.0, 28.0, 12.0, 13.0, 9.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003337860107421875, -0.00032111629843711853, -0.00030844658613204956, -0.0002957768738269806, -0.0002831071615219116, -0.00027043744921684265, -0.0002577677369117737, -0.0002450980246067047, -0.00023242831230163574, -0.00021975859999656677, -0.0002070888876914978, -0.00019441917538642883, -0.00018174946308135986, -0.0001690797507762909, -0.00015641003847122192, -0.00014374032616615295, -0.00013107061386108398, -0.00011840090155601501, -0.00010573118925094604, -9.306147694587708e-05, -8.03917646408081e-05, -6.772205233573914e-05, -5.5052340030670166e-05, -4.2382627725601196e-05, -2.9712915420532227e-05, -1.7043203115463257e-05, -4.373490810394287e-06, 8.296221494674683e-06, 2.0965933799743652e-05, 3.363564610481262e-05, 4.630535840988159e-05, 5.897507071495056e-05, 7.164478302001953e-05, 8.43144953250885e-05, 9.698420763015747e-05, 0.00010965391993522644, 0.0001223236322402954, 0.00013499334454536438, 0.00014766305685043335, 0.00016033276915550232, 0.0001730024814605713, 0.00018567219376564026, 0.00019834190607070923, 0.0002110116183757782, 0.00022368133068084717, 0.00023635104298591614, 0.0002490207552909851, 0.0002616904675960541, 0.00027436017990112305, 0.000287029892206192, 0.000299699604511261, 0.00031236931681632996, 0.0003250390291213989, 0.0003377087414264679, 0.00035037845373153687, 0.00036304816603660583, 0.0003757178783416748, 0.0003883875906467438, 0.00040105730295181274, 0.0004137270152568817, 0.0004263967275619507, 0.00043906643986701965, 0.0004517361521720886, 0.0004644058644771576, 0.00047707557678222656]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 13.0, 14.0, 22.0, 32.0, 39.0, 58.0, 87.0, 169.0, 222.0, 362.0, 597.0, 1071.0, 1901.0, 3533.0, 7136.0, 15521.0, 34861.0, 78876.0, 161166.0, 246764.0, 233057.0, 141153.0, 66453.0, 29021.0, 13062.0, 6145.0, 3119.0, 1647.0, 953.0, 526.0, 331.0, 195.0, 149.0, 92.0, 58.0, 41.0, 23.0, 23.0, 14.0, 8.0, 9.0, 4.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.8125, -3.69659423828125, -3.5806884765625, -3.46478271484375, -3.348876953125, -3.23297119140625, -3.1170654296875, -3.00115966796875, -2.88525390625, -2.76934814453125, -2.6534423828125, -2.53753662109375, -2.421630859375, -2.30572509765625, -2.1898193359375, -2.07391357421875, -1.9580078125, -1.84210205078125, -1.7261962890625, -1.61029052734375, -1.494384765625, -1.37847900390625, -1.2625732421875, -1.14666748046875, -1.03076171875, -0.91485595703125, -0.7989501953125, -0.68304443359375, -0.567138671875, -0.45123291015625, -0.3353271484375, -0.21942138671875, -0.103515625, 0.01239013671875, 0.1282958984375, 0.24420166015625, 0.360107421875, 0.47601318359375, 0.5919189453125, 0.70782470703125, 0.82373046875, 0.93963623046875, 1.0555419921875, 1.17144775390625, 1.287353515625, 1.40325927734375, 1.5191650390625, 1.63507080078125, 1.7509765625, 1.86688232421875, 1.9827880859375, 2.09869384765625, 2.214599609375, 2.33050537109375, 2.4464111328125, 2.56231689453125, 2.67822265625, 2.79412841796875, 2.9100341796875, 3.02593994140625, 3.141845703125, 3.25775146484375, 3.3736572265625, 3.48956298828125, 3.60546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 10.0, 16.0, 14.0, 22.0, 20.0, 26.0, 24.0, 40.0, 45.0, 43.0, 56.0, 60.0, 65.0, 48.0, 75.0, 52.0, 52.0, 49.0, 49.0, 44.0, 40.0, 34.0, 20.0, 22.0, 20.0, 10.0, 17.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.128326416015625, -1.09454345703125, -1.060760498046875, -1.0269775390625, -0.993194580078125, -0.95941162109375, -0.925628662109375, -0.891845703125, -0.858062744140625, -0.82427978515625, -0.790496826171875, -0.7567138671875, -0.722930908203125, -0.68914794921875, -0.655364990234375, -0.62158203125, -0.587799072265625, -0.55401611328125, -0.520233154296875, -0.4864501953125, -0.452667236328125, -0.41888427734375, -0.385101318359375, -0.351318359375, -0.317535400390625, -0.28375244140625, -0.249969482421875, -0.2161865234375, -0.182403564453125, -0.14862060546875, -0.114837646484375, -0.0810546875, -0.047271728515625, -0.01348876953125, 0.020294189453125, 0.0540771484375, 0.087860107421875, 0.12164306640625, 0.155426025390625, 0.189208984375, 0.222991943359375, 0.25677490234375, 0.290557861328125, 0.3243408203125, 0.358123779296875, 0.39190673828125, 0.425689697265625, 0.45947265625, 0.493255615234375, 0.52703857421875, 0.560821533203125, 0.5946044921875, 0.628387451171875, 0.66217041015625, 0.695953369140625, 0.729736328125, 0.763519287109375, 0.79730224609375, 0.831085205078125, 0.8648681640625, 0.898651123046875, 0.93243408203125, 0.966217041015625, 1.0]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 10.0, 18.0, 17.0, 13.0, 18.0, 21.0, 24.0, 29.0, 34.0, 24.0, 39.0, 43.0, 27.0, 34.0, 37.0, 51.0, 56.0, 42.0, 46.0, 40.0, 42.0, 47.0, 30.0, 36.0, 33.0, 24.0, 30.0, 14.0, 20.0, 13.0, 9.0, 10.0, 10.0, 10.0, 2.0, 8.0, 7.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.267155170440674, -5.094008445739746, -4.92086124420166, -4.747714042663574, -4.5745673179626465, -4.401420593261719, -4.228273391723633, -4.055126190185547, -3.881979465484619, -3.7088325023651123, -3.5356855392456055, -3.3625385761260986, -3.189391613006592, -3.016244649887085, -2.843097686767578, -2.6699507236480713, -2.4968037605285645, -2.3236567974090576, -2.150509834289551, -1.977362871170044, -1.804215908050537, -1.6310689449310303, -1.4579219818115234, -1.2847750186920166, -1.1116280555725098, -0.9384810924530029, -0.7653341293334961, -0.5921871662139893, -0.4190402030944824, -0.24589323997497559, -0.07274627685546875, 0.10040068626403809, 0.2735481262207031, 0.44669508934020996, 0.6198420524597168, 0.7929890155792236, 0.9661359786987305, 1.1392829418182373, 1.3124299049377441, 1.485576868057251, 1.6587238311767578, 1.8318707942962646, 2.0050177574157715, 2.1781647205352783, 2.351311683654785, 2.524458646774292, 2.697605609893799, 2.8707525730133057, 3.0438995361328125, 3.2170464992523193, 3.390193462371826, 3.563340425491333, 3.73648738861084, 3.9096343517303467, 4.0827813148498535, 4.255928039550781, 4.429075241088867, 4.602222442626953, 4.775369167327881, 4.948515892028809, 5.1216630935668945, 5.2948102951049805, 5.467957019805908, 5.641103744506836, 5.814250946044922]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 8.0, 11.0, 16.0, 18.0, 14.0, 13.0, 16.0, 24.0, 25.0, 26.0, 30.0, 29.0, 34.0, 43.0, 52.0, 40.0, 45.0, 44.0, 58.0, 41.0, 43.0, 45.0, 33.0, 40.0, 32.0, 26.0, 20.0, 21.0, 22.0, 22.0, 18.0, 16.0, 12.0, 10.0, 8.0, 10.0, 2.0, 7.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.63241720199585, -5.442363739013672, -5.252310752868652, -5.062257766723633, -4.872204303741455, -4.682150840759277, -4.492097854614258, -4.302044868469238, -4.1119914054870605, -3.921938180923462, -3.7318849563598633, -3.5418317317962646, -3.351778507232666, -3.1617252826690674, -2.9716720581054688, -2.78161883354187, -2.5915656089782715, -2.401512384414673, -2.211459159851074, -2.0214059352874756, -1.831352710723877, -1.6412994861602783, -1.4512462615966797, -1.261193037033081, -1.0711398124694824, -0.8810865879058838, -0.6910333633422852, -0.5009801387786865, -0.3109269142150879, -0.12087368965148926, 0.06917953491210938, 0.259232759475708, 0.44928646087646484, 0.6393396854400635, 0.8293929100036621, 1.0194461345672607, 1.2094993591308594, 1.399552583694458, 1.5896058082580566, 1.7796590328216553, 1.969712257385254, 2.1597654819488525, 2.349818706512451, 2.53987193107605, 2.7299251556396484, 2.919978380203247, 3.1100316047668457, 3.3000848293304443, 3.490138053894043, 3.6801912784576416, 3.8702445030212402, 4.060297966003418, 4.2503509521484375, 4.440403938293457, 4.630457401275635, 4.8205108642578125, 5.010563850402832, 5.200616836547852, 5.390670299530029, 5.580723762512207, 5.770776748657227, 5.960829734802246, 6.150883197784424, 6.340936660766602, 6.530989646911621]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 13.0, 22.0, 29.0, 41.0, 67.0, 97.0, 146.0, 207.0, 362.0, 570.0, 913.0, 1495.0, 2400.0, 4255.0, 7244.0, 12855.0, 23271.0, 43738.0, 83904.0, 159887.0, 296558.0, 494769.0, 690852.0, 761760.0, 642696.0, 432380.0, 248061.0, 131884.0, 69289.0, 36928.0, 20206.0, 11299.0, 6375.0, 3830.0, 2273.0, 1395.0, 869.0, 501.0, 283.0, 213.0, 131.0, 72.0, 44.0, 38.0, 14.0, 20.0, 14.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90234375, -4.7408447265625, -4.579345703125, -4.4178466796875, -4.25634765625, -4.0948486328125, -3.933349609375, -3.7718505859375, -3.6103515625, -3.4488525390625, -3.287353515625, -3.1258544921875, -2.96435546875, -2.8028564453125, -2.641357421875, -2.4798583984375, -2.318359375, -2.1568603515625, -1.995361328125, -1.8338623046875, -1.67236328125, -1.5108642578125, -1.349365234375, -1.1878662109375, -1.0263671875, -0.8648681640625, -0.703369140625, -0.5418701171875, -0.38037109375, -0.2188720703125, -0.057373046875, 0.1041259765625, 0.265625, 0.4271240234375, 0.588623046875, 0.7501220703125, 0.91162109375, 1.0731201171875, 1.234619140625, 1.3961181640625, 1.5576171875, 1.7191162109375, 1.880615234375, 2.0421142578125, 2.20361328125, 2.3651123046875, 2.526611328125, 2.6881103515625, 2.849609375, 3.0111083984375, 3.172607421875, 3.3341064453125, 3.49560546875, 3.6571044921875, 3.818603515625, 3.9801025390625, 4.1416015625, 4.3031005859375, 4.464599609375, 4.6260986328125, 4.78759765625, 4.9490966796875, 5.110595703125, 5.2720947265625, 5.43359375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 10.0, 10.0, 12.0, 17.0, 16.0, 21.0, 20.0, 24.0, 23.0, 28.0, 21.0, 46.0, 38.0, 53.0, 39.0, 48.0, 50.0, 46.0, 46.0, 48.0, 34.0, 37.0, 44.0, 35.0, 34.0, 19.0, 22.0, 22.0, 27.0, 15.0, 16.0, 11.0, 15.0, 10.0, 8.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.817626953125, -4.64697265625, -4.476318359375, -4.3056640625, -4.135009765625, -3.96435546875, -3.793701171875, -3.623046875, -3.452392578125, -3.28173828125, -3.111083984375, -2.9404296875, -2.769775390625, -2.59912109375, -2.428466796875, -2.2578125, -2.087158203125, -1.91650390625, -1.745849609375, -1.5751953125, -1.404541015625, -1.23388671875, -1.063232421875, -0.892578125, -0.721923828125, -0.55126953125, -0.380615234375, -0.2099609375, -0.039306640625, 0.13134765625, 0.302001953125, 0.47265625, 0.643310546875, 0.81396484375, 0.984619140625, 1.1552734375, 1.325927734375, 1.49658203125, 1.667236328125, 1.837890625, 2.008544921875, 2.17919921875, 2.349853515625, 2.5205078125, 2.691162109375, 2.86181640625, 3.032470703125, 3.203125, 3.373779296875, 3.54443359375, 3.715087890625, 3.8857421875, 4.056396484375, 4.22705078125, 4.397705078125, 4.568359375, 4.739013671875, 4.90966796875, 5.080322265625, 5.2509765625, 5.421630859375, 5.59228515625, 5.762939453125, 5.93359375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 9.0, 11.0, 9.0, 17.0, 27.0, 47.0, 78.0, 97.0, 143.0, 229.0, 377.0, 555.0, 841.0, 1330.0, 2006.0, 3261.0, 5233.0, 8202.0, 12995.0, 20957.0, 33756.0, 53859.0, 85253.0, 135929.0, 206755.0, 302744.0, 418256.0, 521562.0, 564152.0, 521211.0, 418861.0, 304097.0, 206161.0, 135082.0, 86573.0, 53844.0, 33595.0, 20765.0, 12983.0, 8265.0, 5148.0, 3183.0, 2056.0, 1298.0, 846.0, 574.0, 382.0, 234.0, 161.0, 90.0, 73.0, 41.0, 31.0, 17.0, 10.0, 12.0, 5.0, 2.0, 3.0, 2.0, 2.0], "bins": [-4.55859375, -4.41387939453125, -4.2691650390625, -4.12445068359375, -3.979736328125, -3.83502197265625, -3.6903076171875, -3.54559326171875, -3.40087890625, -3.25616455078125, -3.1114501953125, -2.96673583984375, -2.822021484375, -2.67730712890625, -2.5325927734375, -2.38787841796875, -2.2431640625, -2.09844970703125, -1.9537353515625, -1.80902099609375, -1.664306640625, -1.51959228515625, -1.3748779296875, -1.23016357421875, -1.08544921875, -0.94073486328125, -0.7960205078125, -0.65130615234375, -0.506591796875, -0.36187744140625, -0.2171630859375, -0.07244873046875, 0.072265625, 0.21697998046875, 0.3616943359375, 0.50640869140625, 0.651123046875, 0.79583740234375, 0.9405517578125, 1.08526611328125, 1.22998046875, 1.37469482421875, 1.5194091796875, 1.66412353515625, 1.808837890625, 1.95355224609375, 2.0982666015625, 2.24298095703125, 2.3876953125, 2.53240966796875, 2.6771240234375, 2.82183837890625, 2.966552734375, 3.11126708984375, 3.2559814453125, 3.40069580078125, 3.54541015625, 3.69012451171875, 3.8348388671875, 3.97955322265625, 4.124267578125, 4.26898193359375, 4.4136962890625, 4.55841064453125, 4.703125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 9.0, 6.0, 7.0, 23.0, 21.0, 31.0, 46.0, 47.0, 42.0, 71.0, 86.0, 119.0, 146.0, 169.0, 187.0, 217.0, 236.0, 250.0, 242.0, 227.0, 261.0, 241.0, 230.0, 215.0, 192.0, 153.0, 115.0, 114.0, 86.0, 62.0, 46.0, 33.0, 46.0, 24.0, 16.0, 16.0, 15.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33203125, -2.25518798828125, -2.1783447265625, -2.10150146484375, -2.024658203125, -1.94781494140625, -1.8709716796875, -1.79412841796875, -1.71728515625, -1.64044189453125, -1.5635986328125, -1.48675537109375, -1.409912109375, -1.33306884765625, -1.2562255859375, -1.17938232421875, -1.1025390625, -1.02569580078125, -0.9488525390625, -0.87200927734375, -0.795166015625, -0.71832275390625, -0.6414794921875, -0.56463623046875, -0.48779296875, -0.41094970703125, -0.3341064453125, -0.25726318359375, -0.180419921875, -0.10357666015625, -0.0267333984375, 0.05010986328125, 0.126953125, 0.20379638671875, 0.2806396484375, 0.35748291015625, 0.434326171875, 0.51116943359375, 0.5880126953125, 0.66485595703125, 0.74169921875, 0.81854248046875, 0.8953857421875, 0.97222900390625, 1.049072265625, 1.12591552734375, 1.2027587890625, 1.27960205078125, 1.3564453125, 1.43328857421875, 1.5101318359375, 1.58697509765625, 1.663818359375, 1.74066162109375, 1.8175048828125, 1.89434814453125, 1.97119140625, 2.04803466796875, 2.1248779296875, 2.20172119140625, 2.278564453125, 2.35540771484375, 2.4322509765625, 2.50909423828125, 2.5859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 5.0, 3.0, 1.0, 5.0, 8.0, 9.0, 10.0, 18.0, 12.0, 13.0, 20.0, 23.0, 19.0, 23.0, 16.0, 31.0, 27.0, 33.0, 36.0, 38.0, 31.0, 45.0, 45.0, 40.0, 49.0, 39.0, 39.0, 49.0, 32.0, 42.0, 33.0, 28.0, 29.0, 26.0, 21.0, 12.0, 16.0, 13.0, 10.0, 14.0, 11.0, 7.0, 5.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.788973808288574, -4.6274285316467285, -4.465882778167725, -4.304337501525879, -4.142792224884033, -3.9812467098236084, -3.8197011947631836, -3.658155918121338, -3.496610403060913, -3.3350648880004883, -3.1735196113586426, -3.0119740962982178, -2.850428581237793, -2.6888833045959473, -2.5273377895355225, -2.3657922744750977, -2.204246997833252, -2.042701482772827, -1.8811562061309814, -1.7196106910705566, -1.5580652952194214, -1.3965198993682861, -1.2349743843078613, -1.073428988456726, -0.9118835926055908, -0.7503381967544556, -0.5887927412986755, -0.4272473156452179, -0.26570188999176025, -0.104156494140625, 0.05738896131515503, 0.21893441677093506, 0.3804802894592285, 0.5420256853103638, 0.7035711407661438, 0.8651165962219238, 1.026661992073059, 1.1882073879241943, 1.3497529029846191, 1.5112982988357544, 1.6728436946868896, 1.834389090538025, 1.9959344863891602, 2.157480001449585, 2.3190255165100098, 2.4805707931518555, 2.6421163082122803, 2.803661823272705, 2.965207099914551, 3.1267526149749756, 3.2882978916168213, 3.449843406677246, 3.611388683319092, 3.7729341983795166, 3.9344797134399414, 4.096024990081787, 4.257570266723633, 4.4191155433654785, 4.580661296844482, 4.742206573486328, 4.903751850128174, 5.0652971267700195, 5.226842880249023, 5.388388156890869, 5.549933910369873]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 11.0, 9.0, 2.0, 10.0, 18.0, 11.0, 15.0, 16.0, 23.0, 26.0, 16.0, 23.0, 33.0, 36.0, 27.0, 39.0, 39.0, 42.0, 44.0, 53.0, 47.0, 43.0, 39.0, 29.0, 51.0, 49.0, 35.0, 28.0, 27.0, 19.0, 16.0, 19.0, 11.0, 10.0, 12.0, 10.0, 16.0, 13.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-6.338786602020264, -6.1554999351501465, -5.972213268280029, -5.788926601409912, -5.605639934539795, -5.422353267669678, -5.2390666007995605, -5.055779933929443, -4.872493267059326, -4.689206600189209, -4.505919933319092, -4.322633266448975, -4.139346599578857, -3.9560599327087402, -3.772773265838623, -3.589486598968506, -3.4062001705169678, -3.2229135036468506, -3.0396268367767334, -2.856340169906616, -2.673053503036499, -2.489766836166382, -2.3064804077148438, -2.1231937408447266, -1.9399069547653198, -1.7566202878952026, -1.5733336210250854, -1.3900470733642578, -1.2067604064941406, -1.0234737396240234, -0.8401870727539062, -0.6569004058837891, -0.4736137390136719, -0.2903270721435547, -0.10704043507575989, 0.07624620199203491, 0.2595328688621521, 0.4428195357322693, 0.6261061429977417, 0.8093928098678589, 0.9926794767379761, 1.1759661436080933, 1.3592528104782104, 1.542539358139038, 1.7258260250091553, 1.9091126918792725, 2.0923993587493896, 2.275686025619507, 2.458972692489624, 2.642259359359741, 2.8255460262298584, 3.0088326930999756, 3.1921193599700928, 3.37540602684021, 3.558692455291748, 3.7419791221618652, 3.9252657890319824, 4.1085524559021, 4.291839122772217, 4.475125789642334, 4.658412456512451, 4.841699123382568, 5.0249857902526855, 5.208272457122803, 5.39155912399292]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 10.0, 14.0, 28.0, 47.0, 74.0, 127.0, 212.0, 298.0, 485.0, 744.0, 1182.0, 1903.0, 2975.0, 4610.0, 7129.0, 10688.0, 15656.0, 23056.0, 32252.0, 43959.0, 57175.0, 72141.0, 85179.0, 95446.0, 99781.0, 97593.0, 89825.0, 77100.0, 62474.0, 49487.0, 36839.0, 26314.0, 18135.0, 12292.0, 8233.0, 5487.0, 3502.0, 2270.0, 1455.0, 909.0, 545.0, 337.0, 208.0, 128.0, 97.0, 49.0, 33.0, 32.0, 16.0, 8.0, 6.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.21875, -2.14874267578125, -2.0787353515625, -2.00872802734375, -1.938720703125, -1.86871337890625, -1.7987060546875, -1.72869873046875, -1.65869140625, -1.58868408203125, -1.5186767578125, -1.44866943359375, -1.378662109375, -1.30865478515625, -1.2386474609375, -1.16864013671875, -1.0986328125, -1.02862548828125, -0.9586181640625, -0.88861083984375, -0.818603515625, -0.74859619140625, -0.6785888671875, -0.60858154296875, -0.53857421875, -0.46856689453125, -0.3985595703125, -0.32855224609375, -0.258544921875, -0.18853759765625, -0.1185302734375, -0.04852294921875, 0.021484375, 0.09149169921875, 0.1614990234375, 0.23150634765625, 0.301513671875, 0.37152099609375, 0.4415283203125, 0.51153564453125, 0.58154296875, 0.65155029296875, 0.7215576171875, 0.79156494140625, 0.861572265625, 0.93157958984375, 1.0015869140625, 1.07159423828125, 1.1416015625, 1.21160888671875, 1.2816162109375, 1.35162353515625, 1.421630859375, 1.49163818359375, 1.5616455078125, 1.63165283203125, 1.70166015625, 1.77166748046875, 1.8416748046875, 1.91168212890625, 1.981689453125, 2.05169677734375, 2.1217041015625, 2.19171142578125, 2.26171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 4.0, 11.0, 10.0, 8.0, 17.0, 18.0, 18.0, 16.0, 19.0, 25.0, 35.0, 29.0, 32.0, 36.0, 41.0, 32.0, 43.0, 45.0, 47.0, 47.0, 45.0, 50.0, 41.0, 35.0, 32.0, 41.0, 22.0, 25.0, 27.0, 21.0, 17.0, 16.0, 4.0, 15.0, 11.0, 12.0, 13.0, 9.0, 8.0, 4.0, 7.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.75390625, -5.57989501953125, -5.4058837890625, -5.23187255859375, -5.057861328125, -4.88385009765625, -4.7098388671875, -4.53582763671875, -4.36181640625, -4.18780517578125, -4.0137939453125, -3.83978271484375, -3.665771484375, -3.49176025390625, -3.3177490234375, -3.14373779296875, -2.9697265625, -2.79571533203125, -2.6217041015625, -2.44769287109375, -2.273681640625, -2.09967041015625, -1.9256591796875, -1.75164794921875, -1.57763671875, -1.40362548828125, -1.2296142578125, -1.05560302734375, -0.881591796875, -0.70758056640625, -0.5335693359375, -0.35955810546875, -0.185546875, -0.01153564453125, 0.1624755859375, 0.33648681640625, 0.510498046875, 0.68450927734375, 0.8585205078125, 1.03253173828125, 1.20654296875, 1.38055419921875, 1.5545654296875, 1.72857666015625, 1.902587890625, 2.07659912109375, 2.2506103515625, 2.42462158203125, 2.5986328125, 2.77264404296875, 2.9466552734375, 3.12066650390625, 3.294677734375, 3.46868896484375, 3.6427001953125, 3.81671142578125, 3.99072265625, 4.16473388671875, 4.3387451171875, 4.51275634765625, 4.686767578125, 4.86077880859375, 5.0347900390625, 5.20880126953125, 5.3828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 8.0, 9.0, 20.0, 16.0, 15.0, 41.0, 70.0, 85.0, 140.0, 253.0, 407.0, 736.0, 1382.0, 2538.0, 5124.0, 10260.0, 20471.0, 50927.0, 804343.0, 100861.0, 25546.0, 12338.0, 6128.0, 3178.0, 1643.0, 840.0, 450.0, 263.0, 167.0, 84.0, 68.0, 45.0, 24.0, 21.0, 11.0, 9.0, 6.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.046875, -10.6741943359375, -10.301513671875, -9.9288330078125, -9.55615234375, -9.1834716796875, -8.810791015625, -8.4381103515625, -8.0654296875, -7.6927490234375, -7.320068359375, -6.9473876953125, -6.57470703125, -6.2020263671875, -5.829345703125, -5.4566650390625, -5.083984375, -4.7113037109375, -4.338623046875, -3.9659423828125, -3.59326171875, -3.2205810546875, -2.847900390625, -2.4752197265625, -2.1025390625, -1.7298583984375, -1.357177734375, -0.9844970703125, -0.61181640625, -0.2391357421875, 0.133544921875, 0.5062255859375, 0.87890625, 1.2515869140625, 1.624267578125, 1.9969482421875, 2.36962890625, 2.7423095703125, 3.114990234375, 3.4876708984375, 3.8603515625, 4.2330322265625, 4.605712890625, 4.9783935546875, 5.35107421875, 5.7237548828125, 6.096435546875, 6.4691162109375, 6.841796875, 7.2144775390625, 7.587158203125, 7.9598388671875, 8.33251953125, 8.7052001953125, 9.077880859375, 9.4505615234375, 9.8232421875, 10.1959228515625, 10.568603515625, 10.9412841796875, 11.31396484375, 11.6866455078125, 12.059326171875, 12.4320068359375, 12.8046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 4.0, 5.0, 7.0, 13.0, 11.0, 15.0, 17.0, 15.0, 20.0, 21.0, 27.0, 37.0, 38.0, 33.0, 34.0, 43.0, 39.0, 43.0, 51.0, 43.0, 38.0, 53.0, 39.0, 49.0, 37.0, 28.0, 38.0, 30.0, 18.0, 18.0, 21.0, 12.0, 22.0, 17.0, 6.0, 15.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.60546875, -7.38812255859375, -7.1707763671875, -6.95343017578125, -6.736083984375, -6.51873779296875, -6.3013916015625, -6.08404541015625, -5.86669921875, -5.64935302734375, -5.4320068359375, -5.21466064453125, -4.997314453125, -4.77996826171875, -4.5626220703125, -4.34527587890625, -4.1279296875, -3.91058349609375, -3.6932373046875, -3.47589111328125, -3.258544921875, -3.04119873046875, -2.8238525390625, -2.60650634765625, -2.38916015625, -2.17181396484375, -1.9544677734375, -1.73712158203125, -1.519775390625, -1.30242919921875, -1.0850830078125, -0.86773681640625, -0.650390625, -0.43304443359375, -0.2156982421875, 0.00164794921875, 0.218994140625, 0.43634033203125, 0.6536865234375, 0.87103271484375, 1.08837890625, 1.30572509765625, 1.5230712890625, 1.74041748046875, 1.957763671875, 2.17510986328125, 2.3924560546875, 2.60980224609375, 2.8271484375, 3.04449462890625, 3.2618408203125, 3.47918701171875, 3.696533203125, 3.91387939453125, 4.1312255859375, 4.34857177734375, 4.56591796875, 4.78326416015625, 5.0006103515625, 5.21795654296875, 5.435302734375, 5.65264892578125, 5.8699951171875, 6.08734130859375, 6.3046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 13.0, 11.0, 16.0, 16.0, 17.0, 53.0, 62.0, 102.0, 127.0, 196.0, 320.0, 513.0, 793.0, 1131.0, 1903.0, 3323.0, 5615.0, 10941.0, 23288.0, 88599.0, 749686.0, 109315.0, 25587.0, 11806.0, 6080.0, 3441.0, 2067.0, 1266.0, 821.0, 459.0, 334.0, 226.0, 143.0, 84.0, 77.0, 35.0, 30.0, 20.0, 19.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.72967529296875, -4.5843505859375, -4.43902587890625, -4.293701171875, -4.14837646484375, -4.0030517578125, -3.85772705078125, -3.71240234375, -3.56707763671875, -3.4217529296875, -3.27642822265625, -3.131103515625, -2.98577880859375, -2.8404541015625, -2.69512939453125, -2.5498046875, -2.40447998046875, -2.2591552734375, -2.11383056640625, -1.968505859375, -1.82318115234375, -1.6778564453125, -1.53253173828125, -1.38720703125, -1.24188232421875, -1.0965576171875, -0.95123291015625, -0.805908203125, -0.66058349609375, -0.5152587890625, -0.36993408203125, -0.224609375, -0.07928466796875, 0.0660400390625, 0.21136474609375, 0.356689453125, 0.50201416015625, 0.6473388671875, 0.79266357421875, 0.93798828125, 1.08331298828125, 1.2286376953125, 1.37396240234375, 1.519287109375, 1.66461181640625, 1.8099365234375, 1.95526123046875, 2.1005859375, 2.24591064453125, 2.3912353515625, 2.53656005859375, 2.681884765625, 2.82720947265625, 2.9725341796875, 3.11785888671875, 3.26318359375, 3.40850830078125, 3.5538330078125, 3.69915771484375, 3.844482421875, 3.98980712890625, 4.1351318359375, 4.28045654296875, 4.42578125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 4.0, 9.0, 10.0, 15.0, 19.0, 28.0, 43.0, 45.0, 63.0, 66.0, 84.0, 84.0, 100.0, 77.0, 75.0, 57.0, 54.0, 34.0, 26.0, 20.0, 15.0, 10.0, 14.0, 10.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013523101806640625, -0.0013165324926376343, -0.001280754804611206, -0.0012449771165847778, -0.0012091994285583496, -0.0011734217405319214, -0.0011376440525054932, -0.001101866364479065, -0.0010660886764526367, -0.0010303109884262085, -0.0009945333003997803, -0.000958755612373352, -0.0009229779243469238, -0.0008872002363204956, -0.0008514225482940674, -0.0008156448602676392, -0.0007798671722412109, -0.0007440894842147827, -0.0007083117961883545, -0.0006725341081619263, -0.000636756420135498, -0.0006009787321090698, -0.0005652010440826416, -0.0005294233560562134, -0.0004936456680297852, -0.00045786798000335693, -0.0004220902919769287, -0.0003863126039505005, -0.00035053491592407227, -0.00031475722789764404, -0.0002789795398712158, -0.0002432018518447876, -0.00020742416381835938, -0.00017164647579193115, -0.00013586878776550293, -0.00010009109973907471, -6.431341171264648e-05, -2.8535723686218262e-05, 7.241964340209961e-06, 4.3019652366638184e-05, 7.87973403930664e-05, 0.00011457502841949463, 0.00015035271644592285, 0.00018613040447235107, 0.0002219080924987793, 0.0002576857805252075, 0.00029346346855163574, 0.00032924115657806396, 0.0003650188446044922, 0.0004007965326309204, 0.00043657422065734863, 0.00047235190868377686, 0.0005081295967102051, 0.0005439072847366333, 0.0005796849727630615, 0.0006154626607894897, 0.000651240348815918, 0.0006870180368423462, 0.0007227957248687744, 0.0007585734128952026, 0.0007943511009216309, 0.0008301287889480591, 0.0008659064769744873, 0.0009016841650009155, 0.0009374618530273438]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 13.0, 17.0, 16.0, 19.0, 32.0, 66.0, 78.0, 113.0, 154.0, 248.0, 392.0, 562.0, 774.0, 1216.0, 1707.0, 2429.0, 3580.0, 5615.0, 8062.0, 12236.0, 18065.0, 26600.0, 40010.0, 59670.0, 87565.0, 121247.0, 147039.0, 144720.0, 115309.0, 81875.0, 55605.0, 37204.0, 24828.0, 16695.0, 11369.0, 7591.0, 4994.0, 3500.0, 2299.0, 1557.0, 1092.0, 779.0, 498.0, 347.0, 230.0, 175.0, 112.0, 86.0, 61.0, 29.0, 23.0, 26.0, 12.0, 7.0, 4.0, 2.0, 1.0, 3.0], "bins": [-1.1474609375, -1.1125946044921875, -1.077728271484375, -1.0428619384765625, -1.00799560546875, -0.9731292724609375, -0.938262939453125, -0.9033966064453125, -0.8685302734375, -0.8336639404296875, -0.798797607421875, -0.7639312744140625, -0.72906494140625, -0.6941986083984375, -0.659332275390625, -0.6244659423828125, -0.589599609375, -0.5547332763671875, -0.519866943359375, -0.4850006103515625, -0.45013427734375, -0.4152679443359375, -0.380401611328125, -0.3455352783203125, -0.3106689453125, -0.2758026123046875, -0.240936279296875, -0.2060699462890625, -0.17120361328125, -0.1363372802734375, -0.101470947265625, -0.0666046142578125, -0.03173828125, 0.0031280517578125, 0.037994384765625, 0.0728607177734375, 0.10772705078125, 0.1425933837890625, 0.177459716796875, 0.2123260498046875, 0.2471923828125, 0.2820587158203125, 0.316925048828125, 0.3517913818359375, 0.38665771484375, 0.4215240478515625, 0.456390380859375, 0.4912567138671875, 0.526123046875, 0.5609893798828125, 0.595855712890625, 0.6307220458984375, 0.66558837890625, 0.7004547119140625, 0.735321044921875, 0.7701873779296875, 0.8050537109375, 0.8399200439453125, 0.874786376953125, 0.9096527099609375, 0.94451904296875, 0.9793853759765625, 1.014251708984375, 1.0491180419921875, 1.083984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 12.0, 7.0, 12.0, 19.0, 27.0, 21.0, 20.0, 23.0, 17.0, 28.0, 29.0, 23.0, 30.0, 29.0, 39.0, 29.0, 41.0, 21.0, 33.0, 21.0, 27.0, 45.0, 39.0, 30.0, 26.0, 33.0, 31.0, 27.0, 32.0, 26.0, 26.0, 32.0, 26.0, 25.0, 24.0, 19.0, 18.0, 11.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37841796875, -0.3661537170410156, -0.35388946533203125, -0.3416252136230469, -0.3293609619140625, -0.3170967102050781, -0.30483245849609375, -0.2925682067871094, -0.280303955078125, -0.2680397033691406, -0.25577545166015625, -0.24351119995117188, -0.2312469482421875, -0.21898269653320312, -0.20671844482421875, -0.19445419311523438, -0.18218994140625, -0.16992568969726562, -0.15766143798828125, -0.14539718627929688, -0.1331329345703125, -0.12086868286132812, -0.10860443115234375, -0.09634017944335938, -0.084075927734375, -0.07181167602539062, -0.05954742431640625, -0.047283172607421875, -0.0350189208984375, -0.022754669189453125, -0.01049041748046875, 0.001773834228515625, 0.0140380859375, 0.026302337646484375, 0.03856658935546875, 0.050830841064453125, 0.0630950927734375, 0.07535934448242188, 0.08762359619140625, 0.09988784790039062, 0.112152099609375, 0.12441635131835938, 0.13668060302734375, 0.14894485473632812, 0.1612091064453125, 0.17347335815429688, 0.18573760986328125, 0.19800186157226562, 0.21026611328125, 0.22253036499023438, 0.23479461669921875, 0.24705886840820312, 0.2593231201171875, 0.2715873718261719, 0.28385162353515625, 0.2961158752441406, 0.308380126953125, 0.3206443786621094, 0.33290863037109375, 0.3451728820800781, 0.3574371337890625, 0.3697013854980469, 0.38196563720703125, 0.3942298889160156, 0.406494140625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 10.0, 16.0, 13.0, 17.0, 22.0, 24.0, 28.0, 37.0, 47.0, 47.0, 52.0, 40.0, 55.0, 53.0, 55.0, 58.0, 59.0, 49.0, 40.0, 49.0, 38.0, 27.0, 30.0, 22.0, 19.0, 23.0, 11.0, 8.0, 10.0, 6.0, 1.0, 6.0, 7.0, 1.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.168818950653076, -6.947234630584717, -6.725649833679199, -6.50406551361084, -6.2824811935424805, -6.060896396636963, -5.8393120765686035, -5.617727279663086, -5.396142959594727, -5.174558639526367, -4.95297384262085, -4.73138952255249, -4.509804725646973, -4.288220405578613, -4.066636085510254, -3.8450515270233154, -3.623466968536377, -3.4018824100494385, -3.1802978515625, -2.9587135314941406, -2.737128973007202, -2.5155444145202637, -2.2939600944519043, -2.072375535964966, -1.8507909774780273, -1.6292064189910889, -1.40762197971344, -1.186037540435791, -0.9644529819488525, -0.7428684234619141, -0.5212839841842651, -0.2996995449066162, -0.07811450958251953, 0.14346998929977417, 0.36505448818206787, 0.5866389870643616, 0.8082234859466553, 1.0298080444335938, 1.2513924837112427, 1.4729769229888916, 1.69456148147583, 1.9161460399627686, 2.137730598449707, 2.3593149185180664, 2.580899477005005, 2.8024840354919434, 3.0240683555603027, 3.245652914047241, 3.4672374725341797, 3.688822031021118, 3.9104065895080566, 4.131990909576416, 4.353575706481934, 4.575160026550293, 4.796744346618652, 5.018328666687012, 5.239913463592529, 5.461497783660889, 5.683082580566406, 5.904666900634766, 6.126251220703125, 6.347836017608643, 6.569420337677002, 6.7910051345825195, 7.012589454650879]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 7.0, 7.0, 20.0, 19.0, 18.0, 32.0, 22.0, 20.0, 27.0, 37.0, 33.0, 29.0, 44.0, 50.0, 43.0, 42.0, 37.0, 48.0, 34.0, 52.0, 39.0, 39.0, 31.0, 26.0, 32.0, 24.0, 20.0, 22.0, 17.0, 20.0, 12.0, 16.0, 6.0, 10.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0], "bins": [-6.221052646636963, -6.034298419952393, -5.847544193267822, -5.660789966583252, -5.47403621673584, -5.2872819900512695, -5.100527763366699, -4.913773536682129, -4.727019309997559, -4.540265083312988, -4.353510856628418, -4.166756629943848, -3.9800026416778564, -3.793248414993286, -3.606494426727295, -3.4197402000427246, -3.2329859733581543, -3.046231746673584, -2.8594775199890137, -2.6727235317230225, -2.485969305038452, -2.299215078353882, -2.1124610900878906, -1.9257068634033203, -1.73895263671875, -1.5521984100341797, -1.365444302558899, -1.1786901950836182, -0.9919359683990479, -0.8051818013191223, -0.6184276342391968, -0.431673526763916, -0.2449188232421875, -0.05816465616226196, 0.12858951091766357, 0.3153436779975891, 0.5020978450775146, 0.6888520121574402, 0.8756061792373657, 1.0623602867126465, 1.2491145133972168, 1.435868740081787, 1.6226228475570679, 1.8093769550323486, 1.996131181716919, 2.1828854084014893, 2.3696393966674805, 2.556393623352051, 2.743147850036621, 2.9299020767211914, 3.1166563034057617, 3.303410291671753, 3.4901645183563232, 3.6769187450408936, 3.8636727333068848, 4.050426959991455, 4.237181186676025, 4.423935413360596, 4.610689640045166, 4.797443866729736, 4.984197616577148, 5.170951843261719, 5.357706069946289, 5.544460296630859, 5.73121452331543]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 15.0, 21.0, 32.0, 41.0, 71.0, 108.0, 143.0, 241.0, 405.0, 607.0, 973.0, 1403.0, 2354.0, 3747.0, 5646.0, 9057.0, 14233.0, 22238.0, 34429.0, 51503.0, 73941.0, 100241.0, 122111.0, 132706.0, 125408.0, 105404.0, 79521.0, 56552.0, 37613.0, 24625.0, 15734.0, 10040.0, 6431.0, 4062.0, 2435.0, 1616.0, 1008.0, 610.0, 420.0, 280.0, 184.0, 127.0, 69.0, 56.0, 39.0, 12.0, 15.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.00390625, -4.8504638671875, -4.697021484375, -4.5435791015625, -4.39013671875, -4.2366943359375, -4.083251953125, -3.9298095703125, -3.7763671875, -3.6229248046875, -3.469482421875, -3.3160400390625, -3.16259765625, -3.0091552734375, -2.855712890625, -2.7022705078125, -2.548828125, -2.3953857421875, -2.241943359375, -2.0885009765625, -1.93505859375, -1.7816162109375, -1.628173828125, -1.4747314453125, -1.3212890625, -1.1678466796875, -1.014404296875, -0.8609619140625, -0.70751953125, -0.5540771484375, -0.400634765625, -0.2471923828125, -0.09375, 0.0596923828125, 0.213134765625, 0.3665771484375, 0.52001953125, 0.6734619140625, 0.826904296875, 0.9803466796875, 1.1337890625, 1.2872314453125, 1.440673828125, 1.5941162109375, 1.74755859375, 1.9010009765625, 2.054443359375, 2.2078857421875, 2.361328125, 2.5147705078125, 2.668212890625, 2.8216552734375, 2.97509765625, 3.1285400390625, 3.281982421875, 3.4354248046875, 3.5888671875, 3.7423095703125, 3.895751953125, 4.0491943359375, 4.20263671875, 4.3560791015625, 4.509521484375, 4.6629638671875, 4.81640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 6.0, 6.0, 15.0, 13.0, 28.0, 17.0, 20.0, 31.0, 22.0, 34.0, 32.0, 25.0, 40.0, 38.0, 45.0, 47.0, 42.0, 44.0, 53.0, 42.0, 44.0, 47.0, 23.0, 32.0, 31.0, 26.0, 33.0, 22.0, 18.0, 17.0, 16.0, 23.0, 12.0, 12.0, 4.0, 7.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.98828125, -5.80322265625, -5.6181640625, -5.43310546875, -5.248046875, -5.06298828125, -4.8779296875, -4.69287109375, -4.5078125, -4.32275390625, -4.1376953125, -3.95263671875, -3.767578125, -3.58251953125, -3.3974609375, -3.21240234375, -3.02734375, -2.84228515625, -2.6572265625, -2.47216796875, -2.287109375, -2.10205078125, -1.9169921875, -1.73193359375, -1.546875, -1.36181640625, -1.1767578125, -0.99169921875, -0.806640625, -0.62158203125, -0.4365234375, -0.25146484375, -0.06640625, 0.11865234375, 0.3037109375, 0.48876953125, 0.673828125, 0.85888671875, 1.0439453125, 1.22900390625, 1.4140625, 1.59912109375, 1.7841796875, 1.96923828125, 2.154296875, 2.33935546875, 2.5244140625, 2.70947265625, 2.89453125, 3.07958984375, 3.2646484375, 3.44970703125, 3.634765625, 3.81982421875, 4.0048828125, 4.18994140625, 4.375, 4.56005859375, 4.7451171875, 4.93017578125, 5.115234375, 5.30029296875, 5.4853515625, 5.67041015625, 5.85546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 27.0, 25.0, 40.0, 64.0, 87.0, 121.0, 196.0, 353.0, 453.0, 726.0, 1065.0, 1677.0, 2509.0, 3942.0, 5898.0, 9248.0, 14347.0, 22337.0, 34874.0, 54050.0, 80631.0, 114707.0, 142882.0, 149409.0, 128375.0, 95561.0, 65228.0, 42709.0, 27162.0, 17500.0, 11263.0, 7318.0, 4800.0, 3147.0, 1940.0, 1280.0, 844.0, 569.0, 395.0, 256.0, 187.0, 129.0, 62.0, 51.0, 43.0, 27.0, 13.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0], "bins": [-7.95703125, -7.72454833984375, -7.4920654296875, -7.25958251953125, -7.027099609375, -6.79461669921875, -6.5621337890625, -6.32965087890625, -6.09716796875, -5.86468505859375, -5.6322021484375, -5.39971923828125, -5.167236328125, -4.93475341796875, -4.7022705078125, -4.46978759765625, -4.2373046875, -4.00482177734375, -3.7723388671875, -3.53985595703125, -3.307373046875, -3.07489013671875, -2.8424072265625, -2.60992431640625, -2.37744140625, -2.14495849609375, -1.9124755859375, -1.67999267578125, -1.447509765625, -1.21502685546875, -0.9825439453125, -0.75006103515625, -0.517578125, -0.28509521484375, -0.0526123046875, 0.17987060546875, 0.412353515625, 0.64483642578125, 0.8773193359375, 1.10980224609375, 1.34228515625, 1.57476806640625, 1.8072509765625, 2.03973388671875, 2.272216796875, 2.50469970703125, 2.7371826171875, 2.96966552734375, 3.2021484375, 3.43463134765625, 3.6671142578125, 3.89959716796875, 4.132080078125, 4.36456298828125, 4.5970458984375, 4.82952880859375, 5.06201171875, 5.29449462890625, 5.5269775390625, 5.75946044921875, 5.991943359375, 6.22442626953125, 6.4569091796875, 6.68939208984375, 6.921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 6.0, 16.0, 10.0, 21.0, 23.0, 19.0, 14.0, 30.0, 20.0, 25.0, 29.0, 37.0, 39.0, 30.0, 33.0, 36.0, 40.0, 44.0, 49.0, 40.0, 44.0, 45.0, 34.0, 28.0, 32.0, 28.0, 24.0, 24.0, 30.0, 23.0, 15.0, 17.0, 6.0, 7.0, 15.0, 8.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.7265625, -4.5882568359375, -4.449951171875, -4.3116455078125, -4.17333984375, -4.0350341796875, -3.896728515625, -3.7584228515625, -3.6201171875, -3.4818115234375, -3.343505859375, -3.2052001953125, -3.06689453125, -2.9285888671875, -2.790283203125, -2.6519775390625, -2.513671875, -2.3753662109375, -2.237060546875, -2.0987548828125, -1.96044921875, -1.8221435546875, -1.683837890625, -1.5455322265625, -1.4072265625, -1.2689208984375, -1.130615234375, -0.9923095703125, -0.85400390625, -0.7156982421875, -0.577392578125, -0.4390869140625, -0.30078125, -0.1624755859375, -0.024169921875, 0.1141357421875, 0.25244140625, 0.3907470703125, 0.529052734375, 0.6673583984375, 0.8056640625, 0.9439697265625, 1.082275390625, 1.2205810546875, 1.35888671875, 1.4971923828125, 1.635498046875, 1.7738037109375, 1.912109375, 2.0504150390625, 2.188720703125, 2.3270263671875, 2.46533203125, 2.6036376953125, 2.741943359375, 2.8802490234375, 3.0185546875, 3.1568603515625, 3.295166015625, 3.4334716796875, 3.57177734375, 3.7100830078125, 3.848388671875, 3.9866943359375, 4.125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 10.0, 14.0, 14.0, 19.0, 36.0, 60.0, 86.0, 121.0, 188.0, 275.0, 435.0, 676.0, 1081.0, 1691.0, 2814.0, 4563.0, 8037.0, 14256.0, 27831.0, 59671.0, 162481.0, 404062.0, 215152.0, 73317.0, 32434.0, 16443.0, 9163.0, 5198.0, 3063.0, 1909.0, 1223.0, 742.0, 497.0, 310.0, 234.0, 153.0, 106.0, 56.0, 51.0, 23.0, 19.0, 12.0, 8.0, 3.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7734375, -11.44287109375, -11.1123046875, -10.78173828125, -10.451171875, -10.12060546875, -9.7900390625, -9.45947265625, -9.12890625, -8.79833984375, -8.4677734375, -8.13720703125, -7.806640625, -7.47607421875, -7.1455078125, -6.81494140625, -6.484375, -6.15380859375, -5.8232421875, -5.49267578125, -5.162109375, -4.83154296875, -4.5009765625, -4.17041015625, -3.83984375, -3.50927734375, -3.1787109375, -2.84814453125, -2.517578125, -2.18701171875, -1.8564453125, -1.52587890625, -1.1953125, -0.86474609375, -0.5341796875, -0.20361328125, 0.126953125, 0.45751953125, 0.7880859375, 1.11865234375, 1.44921875, 1.77978515625, 2.1103515625, 2.44091796875, 2.771484375, 3.10205078125, 3.4326171875, 3.76318359375, 4.09375, 4.42431640625, 4.7548828125, 5.08544921875, 5.416015625, 5.74658203125, 6.0771484375, 6.40771484375, 6.73828125, 7.06884765625, 7.3994140625, 7.72998046875, 8.060546875, 8.39111328125, 8.7216796875, 9.05224609375, 9.3828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 10.0, 2.0, 10.0, 21.0, 27.0, 40.0, 87.0, 125.0, 233.0, 183.0, 104.0, 57.0, 28.0, 20.0, 16.0, 14.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020751953125, -0.002025499939918518, -0.001975804567337036, -0.0019261091947555542, -0.0018764138221740723, -0.0018267184495925903, -0.0017770230770111084, -0.0017273277044296265, -0.0016776323318481445, -0.0016279369592666626, -0.0015782415866851807, -0.0015285462141036987, -0.0014788508415222168, -0.0014291554689407349, -0.001379460096359253, -0.001329764723777771, -0.001280069351196289, -0.0012303739786148071, -0.0011806786060333252, -0.0011309832334518433, -0.0010812878608703613, -0.0010315924882888794, -0.0009818971157073975, -0.0009322017431259155, -0.0008825063705444336, -0.0008328109979629517, -0.0007831156253814697, -0.0007334202527999878, -0.0006837248802185059, -0.0006340295076370239, -0.000584334135055542, -0.0005346387624740601, -0.0004849433898925781, -0.0004352480173110962, -0.00038555264472961426, -0.0003358572721481323, -0.0002861618995666504, -0.00023646652698516846, -0.00018677115440368652, -0.0001370757818222046, -8.738040924072266e-05, -3.768503665924072e-05, 1.2010335922241211e-05, 6.170570850372314e-05, 0.00011140108108520508, 0.000161096453666687, 0.00021079182624816895, 0.0002604871988296509, 0.0003101825714111328, 0.00035987794399261475, 0.0004095733165740967, 0.0004592686891555786, 0.0005089640617370605, 0.0005586594343185425, 0.0006083548069000244, 0.0006580501794815063, 0.0007077455520629883, 0.0007574409246444702, 0.0008071362972259521, 0.0008568316698074341, 0.000906527042388916, 0.000956222414970398, 0.0010059177875518799, 0.0010556131601333618, 0.0011053085327148438]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 16.0, 18.0, 32.0, 37.0, 47.0, 96.0, 104.0, 179.0, 267.0, 386.0, 632.0, 991.0, 1651.0, 2871.0, 5347.0, 10858.0, 23254.0, 61860.0, 233794.0, 478573.0, 146141.0, 44200.0, 17826.0, 8461.0, 4481.0, 2479.0, 1392.0, 888.0, 519.0, 343.0, 237.0, 149.0, 115.0, 77.0, 47.0, 39.0, 34.0, 24.0, 15.0, 14.0, 9.0, 11.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.7421875, -11.327880859375, -10.91357421875, -10.499267578125, -10.0849609375, -9.670654296875, -9.25634765625, -8.842041015625, -8.427734375, -8.013427734375, -7.59912109375, -7.184814453125, -6.7705078125, -6.356201171875, -5.94189453125, -5.527587890625, -5.11328125, -4.698974609375, -4.28466796875, -3.870361328125, -3.4560546875, -3.041748046875, -2.62744140625, -2.213134765625, -1.798828125, -1.384521484375, -0.97021484375, -0.555908203125, -0.1416015625, 0.272705078125, 0.68701171875, 1.101318359375, 1.515625, 1.929931640625, 2.34423828125, 2.758544921875, 3.1728515625, 3.587158203125, 4.00146484375, 4.415771484375, 4.830078125, 5.244384765625, 5.65869140625, 6.072998046875, 6.4873046875, 6.901611328125, 7.31591796875, 7.730224609375, 8.14453125, 8.558837890625, 8.97314453125, 9.387451171875, 9.8017578125, 10.216064453125, 10.63037109375, 11.044677734375, 11.458984375, 11.873291015625, 12.28759765625, 12.701904296875, 13.1162109375, 13.530517578125, 13.94482421875, 14.359130859375, 14.7734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 16.0, 26.0, 20.0, 29.0, 40.0, 51.0, 60.0, 75.0, 108.0, 88.0, 102.0, 80.0, 57.0, 47.0, 49.0, 31.0, 23.0, 15.0, 9.0, 14.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.777099609375, -3.67138671875, -3.565673828125, -3.4599609375, -3.354248046875, -3.24853515625, -3.142822265625, -3.037109375, -2.931396484375, -2.82568359375, -2.719970703125, -2.6142578125, -2.508544921875, -2.40283203125, -2.297119140625, -2.19140625, -2.085693359375, -1.97998046875, -1.874267578125, -1.7685546875, -1.662841796875, -1.55712890625, -1.451416015625, -1.345703125, -1.239990234375, -1.13427734375, -1.028564453125, -0.9228515625, -0.817138671875, -0.71142578125, -0.605712890625, -0.5, -0.394287109375, -0.28857421875, -0.182861328125, -0.0771484375, 0.028564453125, 0.13427734375, 0.239990234375, 0.345703125, 0.451416015625, 0.55712890625, 0.662841796875, 0.7685546875, 0.874267578125, 0.97998046875, 1.085693359375, 1.19140625, 1.297119140625, 1.40283203125, 1.508544921875, 1.6142578125, 1.719970703125, 1.82568359375, 1.931396484375, 2.037109375, 2.142822265625, 2.24853515625, 2.354248046875, 2.4599609375, 2.565673828125, 2.67138671875, 2.777099609375, 2.8828125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 7.0, 19.0, 17.0, 27.0, 30.0, 35.0, 33.0, 40.0, 58.0, 57.0, 49.0, 64.0, 62.0, 59.0, 53.0, 43.0, 49.0, 40.0, 45.0, 33.0, 26.0, 15.0, 20.0, 21.0, 18.0, 16.0, 10.0, 10.0, 10.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.045910835266113, -5.805994033813477, -5.566076755523682, -5.326159477233887, -5.08624267578125, -4.846325874328613, -4.606408596038818, -4.366491317749023, -4.126574516296387, -3.886657476425171, -3.646740436553955, -3.4068233966827393, -3.1669063568115234, -2.9269893169403076, -2.687072277069092, -2.447155237197876, -2.20723819732666, -1.9673211574554443, -1.7274041175842285, -1.4874870777130127, -1.2475700378417969, -1.007652997970581, -0.7677359580993652, -0.5278189182281494, -0.2879018783569336, -0.04798483848571777, 0.19193220138549805, 0.43184924125671387, 0.6717662811279297, 0.9116833209991455, 1.1516003608703613, 1.3915174007415771, 1.631434440612793, 1.8713514804840088, 2.1112685203552246, 2.3511855602264404, 2.5911026000976562, 2.831019639968872, 3.070936679840088, 3.3108537197113037, 3.5507707595825195, 3.7906877994537354, 4.030604839324951, 4.270522117614746, 4.510438919067383, 4.7503557205200195, 4.9902729988098145, 5.230190277099609, 5.470107078552246, 5.710023880004883, 5.949941158294678, 6.189858436584473, 6.429775238037109, 6.669692039489746, 6.909609317779541, 7.149526596069336, 7.389443397521973, 7.629360198974609, 7.869277477264404, 8.1091947555542, 8.349111557006836, 8.589028358459473, 8.82894515991211, 9.068862915039062, 9.3087797164917]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 7.0, 11.0, 6.0, 6.0, 14.0, 12.0, 14.0, 22.0, 26.0, 15.0, 34.0, 25.0, 37.0, 29.0, 41.0, 31.0, 48.0, 50.0, 33.0, 36.0, 41.0, 41.0, 54.0, 33.0, 45.0, 42.0, 32.0, 28.0, 25.0, 30.0, 22.0, 17.0, 17.0, 8.0, 13.0, 8.0, 11.0, 7.0, 12.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-7.696906089782715, -7.490312099456787, -7.283718585968018, -7.07712459564209, -6.870530605316162, -6.663936614990234, -6.457343101501465, -6.250749111175537, -6.044155120849609, -5.837561130523682, -5.630967617034912, -5.424373626708984, -5.217779636383057, -5.011185646057129, -4.804592132568359, -4.597998142242432, -4.391404151916504, -4.184810161590576, -3.9782164096832275, -3.771622657775879, -3.565028667449951, -3.3584349155426025, -3.151841163635254, -2.945247173309326, -2.7386536598205566, -2.532059907913208, -2.3254659175872803, -2.1188721656799316, -1.912278175354004, -1.7056844234466553, -1.499090552330017, -1.292496681213379, -1.0859026908874512, -0.879308819770813, -0.6727149486541748, -0.4661211371421814, -0.2595272660255432, -0.052933454513549805, 0.15366041660308838, 0.36025428771972656, 0.5668481588363647, 0.7734420299530029, 0.9800359010696411, 1.1866297721862793, 1.393223524093628, 1.5998173952102661, 1.8064112663269043, 2.013005256652832, 2.2195990085601807, 2.4261927604675293, 2.632786750793457, 2.8393805027008057, 3.0459744930267334, 3.252568244934082, 3.4591622352600098, 3.6657559871673584, 3.872349739074707, 4.078943729400635, 4.285537242889404, 4.492131233215332, 4.69872522354126, 4.9053192138671875, 5.111912727355957, 5.318506717681885, 5.5251007080078125]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 7.0, 4.0, 6.0, 6.0, 18.0, 20.0, 28.0, 69.0, 84.0, 105.0, 147.0, 219.0, 342.0, 536.0, 757.0, 1122.0, 1734.0, 2715.0, 4274.0, 6865.0, 11499.0, 20078.0, 35634.0, 67491.0, 131655.0, 261338.0, 479980.0, 737032.0, 838654.0, 685196.0, 427068.0, 227312.0, 115120.0, 59365.0, 32126.0, 17947.0, 10446.0, 6228.0, 3822.0, 2543.0, 1512.0, 1041.0, 665.0, 477.0, 301.0, 232.0, 153.0, 107.0, 56.0, 47.0, 40.0, 23.0, 22.0, 11.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0], "bins": [-5.83203125, -5.646240234375, -5.46044921875, -5.274658203125, -5.0888671875, -4.903076171875, -4.71728515625, -4.531494140625, -4.345703125, -4.159912109375, -3.97412109375, -3.788330078125, -3.6025390625, -3.416748046875, -3.23095703125, -3.045166015625, -2.859375, -2.673583984375, -2.48779296875, -2.302001953125, -2.1162109375, -1.930419921875, -1.74462890625, -1.558837890625, -1.373046875, -1.187255859375, -1.00146484375, -0.815673828125, -0.6298828125, -0.444091796875, -0.25830078125, -0.072509765625, 0.11328125, 0.299072265625, 0.48486328125, 0.670654296875, 0.8564453125, 1.042236328125, 1.22802734375, 1.413818359375, 1.599609375, 1.785400390625, 1.97119140625, 2.156982421875, 2.3427734375, 2.528564453125, 2.71435546875, 2.900146484375, 3.0859375, 3.271728515625, 3.45751953125, 3.643310546875, 3.8291015625, 4.014892578125, 4.20068359375, 4.386474609375, 4.572265625, 4.758056640625, 4.94384765625, 5.129638671875, 5.3154296875, 5.501220703125, 5.68701171875, 5.872802734375, 6.05859375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 3.0, 6.0, 7.0, 7.0, 12.0, 10.0, 17.0, 15.0, 17.0, 19.0, 28.0, 31.0, 33.0, 35.0, 18.0, 32.0, 38.0, 52.0, 42.0, 39.0, 39.0, 38.0, 34.0, 35.0, 50.0, 32.0, 44.0, 31.0, 26.0, 24.0, 26.0, 21.0, 27.0, 10.0, 8.0, 17.0, 6.0, 15.0, 11.0, 5.0, 8.0, 7.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0], "bins": [-5.9296875, -5.76641845703125, -5.6031494140625, -5.43988037109375, -5.276611328125, -5.11334228515625, -4.9500732421875, -4.78680419921875, -4.62353515625, -4.46026611328125, -4.2969970703125, -4.13372802734375, -3.970458984375, -3.80718994140625, -3.6439208984375, -3.48065185546875, -3.3173828125, -3.15411376953125, -2.9908447265625, -2.82757568359375, -2.664306640625, -2.50103759765625, -2.3377685546875, -2.17449951171875, -2.01123046875, -1.84796142578125, -1.6846923828125, -1.52142333984375, -1.358154296875, -1.19488525390625, -1.0316162109375, -0.86834716796875, -0.705078125, -0.54180908203125, -0.3785400390625, -0.21527099609375, -0.052001953125, 0.11126708984375, 0.2745361328125, 0.43780517578125, 0.60107421875, 0.76434326171875, 0.9276123046875, 1.09088134765625, 1.254150390625, 1.41741943359375, 1.5806884765625, 1.74395751953125, 1.9072265625, 2.07049560546875, 2.2337646484375, 2.39703369140625, 2.560302734375, 2.72357177734375, 2.8868408203125, 3.05010986328125, 3.21337890625, 3.37664794921875, 3.5399169921875, 3.70318603515625, 3.866455078125, 4.02972412109375, 4.1929931640625, 4.35626220703125, 4.51953125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 5.0, 7.0, 10.0, 25.0, 46.0, 38.0, 64.0, 124.0, 146.0, 197.0, 267.0, 392.0, 609.0, 940.0, 1518.0, 2372.0, 4011.0, 6701.0, 11348.0, 20199.0, 37409.0, 70558.0, 136144.0, 257878.0, 462173.0, 720498.0, 845719.0, 685647.0, 426926.0, 235242.0, 123200.0, 64363.0, 34237.0, 18489.0, 10397.0, 6163.0, 3754.0, 2252.0, 1463.0, 942.0, 602.0, 385.0, 270.0, 161.0, 119.0, 95.0, 65.0, 38.0, 25.0, 21.0, 12.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.66778564453125, -6.4332275390625, -6.19866943359375, -5.964111328125, -5.72955322265625, -5.4949951171875, -5.26043701171875, -5.02587890625, -4.79132080078125, -4.5567626953125, -4.32220458984375, -4.087646484375, -3.85308837890625, -3.6185302734375, -3.38397216796875, -3.1494140625, -2.91485595703125, -2.6802978515625, -2.44573974609375, -2.211181640625, -1.97662353515625, -1.7420654296875, -1.50750732421875, -1.27294921875, -1.03839111328125, -0.8038330078125, -0.56927490234375, -0.334716796875, -0.10015869140625, 0.1343994140625, 0.36895751953125, 0.603515625, 0.83807373046875, 1.0726318359375, 1.30718994140625, 1.541748046875, 1.77630615234375, 2.0108642578125, 2.24542236328125, 2.47998046875, 2.71453857421875, 2.9490966796875, 3.18365478515625, 3.418212890625, 3.65277099609375, 3.8873291015625, 4.12188720703125, 4.3564453125, 4.59100341796875, 4.8255615234375, 5.06011962890625, 5.294677734375, 5.52923583984375, 5.7637939453125, 5.99835205078125, 6.23291015625, 6.46746826171875, 6.7020263671875, 6.93658447265625, 7.171142578125, 7.40570068359375, 7.6402587890625, 7.87481689453125, 8.109375]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 10.0, 8.0, 8.0, 17.0, 22.0, 21.0, 29.0, 42.0, 47.0, 54.0, 74.0, 91.0, 100.0, 131.0, 160.0, 186.0, 202.0, 220.0, 264.0, 266.0, 264.0, 276.0, 224.0, 263.0, 193.0, 165.0, 144.0, 132.0, 88.0, 65.0, 87.0, 48.0, 46.0, 27.0, 22.0, 20.0, 11.0, 7.0, 11.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.578125, -2.491973876953125, -2.40582275390625, -2.319671630859375, -2.2335205078125, -2.147369384765625, -2.06121826171875, -1.975067138671875, -1.888916015625, -1.802764892578125, -1.71661376953125, -1.630462646484375, -1.5443115234375, -1.458160400390625, -1.37200927734375, -1.285858154296875, -1.19970703125, -1.113555908203125, -1.02740478515625, -0.941253662109375, -0.8551025390625, -0.768951416015625, -0.68280029296875, -0.596649169921875, -0.510498046875, -0.424346923828125, -0.33819580078125, -0.252044677734375, -0.1658935546875, -0.079742431640625, 0.00640869140625, 0.092559814453125, 0.1787109375, 0.264862060546875, 0.35101318359375, 0.437164306640625, 0.5233154296875, 0.609466552734375, 0.69561767578125, 0.781768798828125, 0.867919921875, 0.954071044921875, 1.04022216796875, 1.126373291015625, 1.2125244140625, 1.298675537109375, 1.38482666015625, 1.470977783203125, 1.55712890625, 1.643280029296875, 1.72943115234375, 1.815582275390625, 1.9017333984375, 1.987884521484375, 2.07403564453125, 2.160186767578125, 2.246337890625, 2.332489013671875, 2.41864013671875, 2.504791259765625, 2.5909423828125, 2.677093505859375, 2.76324462890625, 2.849395751953125, 2.935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 10.0, 12.0, 17.0, 19.0, 13.0, 30.0, 17.0, 38.0, 23.0, 39.0, 44.0, 51.0, 58.0, 49.0, 52.0, 54.0, 52.0, 56.0, 51.0, 44.0, 42.0, 27.0, 24.0, 41.0, 15.0, 15.0, 24.0, 14.0, 10.0, 10.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.858084201812744, -6.623102188110352, -6.388120174407959, -6.153138160705566, -5.918155670166016, -5.683173656463623, -5.4481916427612305, -5.213209629058838, -4.978227615356445, -4.743245601654053, -4.50826358795166, -4.273281097412109, -4.038299083709717, -3.803317070007324, -3.5683350563049316, -3.333353042602539, -3.0983705520629883, -2.8633885383605957, -2.628406286239624, -2.3934242725372314, -2.1584420204162598, -1.9234600067138672, -1.6884779930114746, -1.4534958600997925, -1.2185137271881104, -0.9835315942764282, -0.7485495209693909, -0.5135674476623535, -0.2785853147506714, -0.04360318183898926, 0.19137883186340332, 0.42636096477508545, 0.6613426208496094, 0.8963247537612915, 1.1313068866729736, 1.3662889003753662, 1.6012710332870483, 1.8362531661987305, 2.071235179901123, 2.3062171936035156, 2.5411994457244873, 2.77618145942688, 3.0111637115478516, 3.246145725250244, 3.4811277389526367, 3.7161099910736084, 3.951092004776001, 4.186074256896973, 4.421056270599365, 4.656038284301758, 4.89102029800415, 5.126002311706543, 5.360984802246094, 5.595966815948486, 5.830948829650879, 6.0659308433532715, 6.300912857055664, 6.535894870758057, 6.770876884460449, 7.005859375, 7.240841388702393, 7.475823402404785, 7.710805416107178, 7.94578742980957, 8.180769920349121]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 1.0, 6.0, 5.0, 7.0, 13.0, 7.0, 9.0, 9.0, 17.0, 16.0, 18.0, 12.0, 28.0, 25.0, 29.0, 29.0, 23.0, 23.0, 31.0, 30.0, 29.0, 44.0, 42.0, 37.0, 39.0, 43.0, 30.0, 33.0, 40.0, 29.0, 36.0, 29.0, 33.0, 25.0, 24.0, 26.0, 23.0, 10.0, 11.0, 15.0, 13.0, 9.0, 12.0, 2.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.9501051902771, -5.77345085144043, -5.596796035766602, -5.420141696929932, -5.243487358093262, -5.066833019256592, -4.890178680419922, -4.713523864746094, -4.536869525909424, -4.360215187072754, -4.183560371398926, -4.006906032562256, -3.830251693725586, -3.653597354888916, -3.476942777633667, -3.300288200378418, -3.123633861541748, -2.946979522705078, -2.770324945449829, -2.59367036819458, -2.41701602935791, -2.2403616905212402, -2.063707113265991, -1.8870526552200317, -1.7103981971740723, -1.5337437391281128, -1.3570892810821533, -1.1804348230361938, -1.0037803649902344, -0.8271259069442749, -0.6504714488983154, -0.47381699085235596, -0.2971630096435547, -0.12050855159759521, 0.05614590644836426, 0.23280036449432373, 0.4094548225402832, 0.5861092805862427, 0.7627637386322021, 0.9394181966781616, 1.116072654724121, 1.2927271127700806, 1.46938157081604, 1.6460360288619995, 1.822690486907959, 1.9993449449539185, 2.175999402999878, 2.352653980255127, 2.529308319091797, 2.705962657928467, 2.882617235183716, 3.059271812438965, 3.2359261512756348, 3.4125804901123047, 3.5892350673675537, 3.7658896446228027, 3.9425439834594727, 4.119198322296143, 4.2958526611328125, 4.472507476806641, 4.6491618156433105, 4.8258161544799805, 5.002470970153809, 5.1791253089904785, 5.355779647827148]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 8.0, 16.0, 25.0, 28.0, 43.0, 68.0, 101.0, 197.0, 311.0, 454.0, 699.0, 1128.0, 1740.0, 2700.0, 4382.0, 6823.0, 11030.0, 17563.0, 28152.0, 44335.0, 67909.0, 99426.0, 132320.0, 150621.0, 142032.0, 112872.0, 79741.0, 53033.0, 33860.0, 21120.0, 13129.0, 8219.0, 5247.0, 3375.0, 2094.0, 1367.0, 894.0, 572.0, 340.0, 207.0, 131.0, 108.0, 44.0, 33.0, 18.0, 17.0, 4.0, 9.0, 0.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-4.19921875, -4.074615478515625, -3.95001220703125, -3.825408935546875, -3.7008056640625, -3.576202392578125, -3.45159912109375, -3.326995849609375, -3.202392578125, -3.077789306640625, -2.95318603515625, -2.828582763671875, -2.7039794921875, -2.579376220703125, -2.45477294921875, -2.330169677734375, -2.20556640625, -2.080963134765625, -1.95635986328125, -1.831756591796875, -1.7071533203125, -1.582550048828125, -1.45794677734375, -1.333343505859375, -1.208740234375, -1.084136962890625, -0.95953369140625, -0.834930419921875, -0.7103271484375, -0.585723876953125, -0.46112060546875, -0.336517333984375, -0.2119140625, -0.087310791015625, 0.03729248046875, 0.161895751953125, 0.2864990234375, 0.411102294921875, 0.53570556640625, 0.660308837890625, 0.784912109375, 0.909515380859375, 1.03411865234375, 1.158721923828125, 1.2833251953125, 1.407928466796875, 1.53253173828125, 1.657135009765625, 1.78173828125, 1.906341552734375, 2.03094482421875, 2.155548095703125, 2.2801513671875, 2.404754638671875, 2.52935791015625, 2.653961181640625, 2.778564453125, 2.903167724609375, 3.02777099609375, 3.152374267578125, 3.2769775390625, 3.401580810546875, 3.52618408203125, 3.650787353515625, 3.775390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 11.0, 7.0, 9.0, 4.0, 12.0, 9.0, 17.0, 21.0, 10.0, 18.0, 29.0, 20.0, 33.0, 31.0, 14.0, 23.0, 28.0, 36.0, 42.0, 41.0, 38.0, 32.0, 41.0, 37.0, 38.0, 38.0, 34.0, 32.0, 33.0, 26.0, 32.0, 24.0, 21.0, 29.0, 19.0, 17.0, 14.0, 10.0, 9.0, 13.0, 11.0, 1.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0], "bins": [-5.92578125, -5.74896240234375, -5.5721435546875, -5.39532470703125, -5.218505859375, -5.04168701171875, -4.8648681640625, -4.68804931640625, -4.51123046875, -4.33441162109375, -4.1575927734375, -3.98077392578125, -3.803955078125, -3.62713623046875, -3.4503173828125, -3.27349853515625, -3.0966796875, -2.91986083984375, -2.7430419921875, -2.56622314453125, -2.389404296875, -2.21258544921875, -2.0357666015625, -1.85894775390625, -1.68212890625, -1.50531005859375, -1.3284912109375, -1.15167236328125, -0.974853515625, -0.79803466796875, -0.6212158203125, -0.44439697265625, -0.267578125, -0.09075927734375, 0.0860595703125, 0.26287841796875, 0.439697265625, 0.61651611328125, 0.7933349609375, 0.97015380859375, 1.14697265625, 1.32379150390625, 1.5006103515625, 1.67742919921875, 1.854248046875, 2.03106689453125, 2.2078857421875, 2.38470458984375, 2.5615234375, 2.73834228515625, 2.9151611328125, 3.09197998046875, 3.268798828125, 3.44561767578125, 3.6224365234375, 3.79925537109375, 3.97607421875, 4.15289306640625, 4.3297119140625, 4.50653076171875, 4.683349609375, 4.86016845703125, 5.0369873046875, 5.21380615234375, 5.390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 2.0, 9.0, 9.0, 28.0, 28.0, 47.0, 65.0, 84.0, 148.0, 225.0, 331.0, 487.0, 796.0, 1201.0, 1888.0, 3168.0, 5061.0, 8406.0, 14220.0, 26179.0, 108892.0, 741320.0, 78202.0, 24015.0, 13331.0, 7812.0, 4630.0, 2902.0, 1808.0, 1155.0, 711.0, 451.0, 316.0, 206.0, 126.0, 101.0, 68.0, 32.0, 26.0, 13.0, 16.0, 13.0, 6.0, 5.0, 1.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.796875, -8.5078125, -8.21875, -7.9296875, -7.640625, -7.3515625, -7.0625, -6.7734375, -6.484375, -6.1953125, -5.90625, -5.6171875, -5.328125, -5.0390625, -4.75, -4.4609375, -4.171875, -3.8828125, -3.59375, -3.3046875, -3.015625, -2.7265625, -2.4375, -2.1484375, -1.859375, -1.5703125, -1.28125, -0.9921875, -0.703125, -0.4140625, -0.125, 0.1640625, 0.453125, 0.7421875, 1.03125, 1.3203125, 1.609375, 1.8984375, 2.1875, 2.4765625, 2.765625, 3.0546875, 3.34375, 3.6328125, 3.921875, 4.2109375, 4.5, 4.7890625, 5.078125, 5.3671875, 5.65625, 5.9453125, 6.234375, 6.5234375, 6.8125, 7.1015625, 7.390625, 7.6796875, 7.96875, 8.2578125, 8.546875, 8.8359375, 9.125, 9.4140625, 9.703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 6.0, 7.0, 9.0, 11.0, 12.0, 15.0, 19.0, 26.0, 28.0, 18.0, 26.0, 37.0, 38.0, 48.0, 27.0, 39.0, 35.0, 47.0, 38.0, 38.0, 39.0, 52.0, 37.0, 35.0, 52.0, 38.0, 37.0, 28.0, 26.0, 26.0, 15.0, 14.0, 8.0, 13.0, 11.0, 8.0, 10.0, 6.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.46441650390625, -7.2374267578125, -7.01043701171875, -6.783447265625, -6.55645751953125, -6.3294677734375, -6.10247802734375, -5.87548828125, -5.64849853515625, -5.4215087890625, -5.19451904296875, -4.967529296875, -4.74053955078125, -4.5135498046875, -4.28656005859375, -4.0595703125, -3.83258056640625, -3.6055908203125, -3.37860107421875, -3.151611328125, -2.92462158203125, -2.6976318359375, -2.47064208984375, -2.24365234375, -2.01666259765625, -1.7896728515625, -1.56268310546875, -1.335693359375, -1.10870361328125, -0.8817138671875, -0.65472412109375, -0.427734375, -0.20074462890625, 0.0262451171875, 0.25323486328125, 0.480224609375, 0.70721435546875, 0.9342041015625, 1.16119384765625, 1.38818359375, 1.61517333984375, 1.8421630859375, 2.06915283203125, 2.296142578125, 2.52313232421875, 2.7501220703125, 2.97711181640625, 3.2041015625, 3.43109130859375, 3.6580810546875, 3.88507080078125, 4.112060546875, 4.33905029296875, 4.5660400390625, 4.79302978515625, 5.02001953125, 5.24700927734375, 5.4739990234375, 5.70098876953125, 5.927978515625, 6.15496826171875, 6.3819580078125, 6.60894775390625, 6.8359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 13.0, 12.0, 13.0, 33.0, 46.0, 54.0, 95.0, 127.0, 185.0, 271.0, 391.0, 620.0, 953.0, 1489.0, 2427.0, 4075.0, 6959.0, 12641.0, 27511.0, 124697.0, 731466.0, 83276.0, 23463.0, 11260.0, 6459.0, 3664.0, 2223.0, 1415.0, 893.0, 619.0, 371.0, 262.0, 153.0, 113.0, 80.0, 67.0, 34.0, 35.0, 21.0, 15.0, 15.0, 9.0, 2.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 3.0], "bins": [-2.021484375, -1.962738037109375, -1.90399169921875, -1.845245361328125, -1.7864990234375, -1.727752685546875, -1.66900634765625, -1.610260009765625, -1.551513671875, -1.492767333984375, -1.43402099609375, -1.375274658203125, -1.3165283203125, -1.257781982421875, -1.19903564453125, -1.140289306640625, -1.08154296875, -1.022796630859375, -0.96405029296875, -0.905303955078125, -0.8465576171875, -0.787811279296875, -0.72906494140625, -0.670318603515625, -0.611572265625, -0.552825927734375, -0.49407958984375, -0.435333251953125, -0.3765869140625, -0.317840576171875, -0.25909423828125, -0.200347900390625, -0.1416015625, -0.082855224609375, -0.02410888671875, 0.034637451171875, 0.0933837890625, 0.152130126953125, 0.21087646484375, 0.269622802734375, 0.328369140625, 0.387115478515625, 0.44586181640625, 0.504608154296875, 0.5633544921875, 0.622100830078125, 0.68084716796875, 0.739593505859375, 0.79833984375, 0.857086181640625, 0.91583251953125, 0.974578857421875, 1.0333251953125, 1.092071533203125, 1.15081787109375, 1.209564208984375, 1.268310546875, 1.327056884765625, 1.38580322265625, 1.444549560546875, 1.5032958984375, 1.562042236328125, 1.62078857421875, 1.679534912109375, 1.73828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 10.0, 5.0, 10.0, 12.0, 20.0, 32.0, 45.0, 55.0, 73.0, 118.0, 128.0, 138.0, 115.0, 72.0, 38.0, 25.0, 31.0, 15.0, 18.0, 16.0, 11.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009756088256835938, -0.0009476318955421448, -0.0009196549654006958, -0.0008916780352592468, -0.0008637011051177979, -0.0008357241749763489, -0.0008077472448348999, -0.0007797703146934509, -0.000751793384552002, -0.000723816454410553, -0.000695839524269104, -0.000667862594127655, -0.0006398856639862061, -0.0006119087338447571, -0.0005839318037033081, -0.0005559548735618591, -0.0005279779434204102, -0.0005000010132789612, -0.0004720240831375122, -0.00044404715299606323, -0.00041607022285461426, -0.0003880932927131653, -0.0003601163625717163, -0.00033213943243026733, -0.00030416250228881836, -0.0002761855721473694, -0.0002482086420059204, -0.00022023171186447144, -0.00019225478172302246, -0.00016427785158157349, -0.0001363009214401245, -0.00010832399129867554, -8.034706115722656e-05, -5.237013101577759e-05, -2.4393200874328613e-05, 3.5837292671203613e-06, 3.1560659408569336e-05, 5.953758955001831e-05, 8.751451969146729e-05, 0.00011549144983291626, 0.00014346837997436523, 0.0001714453101158142, 0.00019942224025726318, 0.00022739917039871216, 0.00025537610054016113, 0.0002833530306816101, 0.0003113299608230591, 0.00033930689096450806, 0.00036728382110595703, 0.000395260751247406, 0.000423237681388855, 0.00045121461153030396, 0.00047919154167175293, 0.0005071684718132019, 0.0005351454019546509, 0.0005631223320960999, 0.0005910992622375488, 0.0006190761923789978, 0.0006470531225204468, 0.0006750300526618958, 0.0007030069828033447, 0.0007309839129447937, 0.0007589608430862427, 0.0007869377732276917, 0.0008149147033691406]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 15.0, 21.0, 27.0, 30.0, 54.0, 89.0, 111.0, 172.0, 221.0, 380.0, 562.0, 780.0, 1214.0, 1722.0, 2645.0, 3999.0, 5986.0, 8842.0, 13830.0, 22113.0, 35932.0, 60978.0, 101576.0, 157331.0, 190713.0, 163073.0, 107416.0, 64457.0, 38070.0, 23361.0, 14776.0, 9363.0, 6274.0, 4060.0, 2650.0, 1897.0, 1181.0, 798.0, 556.0, 384.0, 281.0, 183.0, 139.0, 83.0, 69.0, 46.0, 28.0, 17.0, 11.0, 14.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.763671875, -0.739471435546875, -0.71527099609375, -0.691070556640625, -0.6668701171875, -0.642669677734375, -0.61846923828125, -0.594268798828125, -0.570068359375, -0.545867919921875, -0.52166748046875, -0.497467041015625, -0.4732666015625, -0.449066162109375, -0.42486572265625, -0.400665283203125, -0.37646484375, -0.352264404296875, -0.32806396484375, -0.303863525390625, -0.2796630859375, -0.255462646484375, -0.23126220703125, -0.207061767578125, -0.182861328125, -0.158660888671875, -0.13446044921875, -0.110260009765625, -0.0860595703125, -0.061859130859375, -0.03765869140625, -0.013458251953125, 0.0107421875, 0.034942626953125, 0.05914306640625, 0.083343505859375, 0.1075439453125, 0.131744384765625, 0.15594482421875, 0.180145263671875, 0.204345703125, 0.228546142578125, 0.25274658203125, 0.276947021484375, 0.3011474609375, 0.325347900390625, 0.34954833984375, 0.373748779296875, 0.39794921875, 0.422149658203125, 0.44635009765625, 0.470550537109375, 0.4947509765625, 0.518951416015625, 0.54315185546875, 0.567352294921875, 0.591552734375, 0.615753173828125, 0.63995361328125, 0.664154052734375, 0.6883544921875, 0.712554931640625, 0.73675537109375, 0.760955810546875, 0.78515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 10.0, 10.0, 10.0, 18.0, 17.0, 13.0, 16.0, 22.0, 26.0, 27.0, 35.0, 43.0, 49.0, 42.0, 44.0, 50.0, 39.0, 34.0, 29.0, 43.0, 48.0, 43.0, 28.0, 43.0, 36.0, 35.0, 25.0, 24.0, 24.0, 17.0, 9.0, 12.0, 15.0, 10.0, 8.0, 11.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0], "bins": [-0.31201171875, -0.3035755157470703, -0.2951393127441406, -0.28670310974121094, -0.27826690673828125, -0.26983070373535156, -0.2613945007324219, -0.2529582977294922, -0.2445220947265625, -0.2360858917236328, -0.22764968872070312, -0.21921348571777344, -0.21077728271484375, -0.20234107971191406, -0.19390487670898438, -0.1854686737060547, -0.177032470703125, -0.1685962677001953, -0.16016006469726562, -0.15172386169433594, -0.14328765869140625, -0.13485145568847656, -0.12641525268554688, -0.11797904968261719, -0.1095428466796875, -0.10110664367675781, -0.09267044067382812, -0.08423423767089844, -0.07579803466796875, -0.06736183166503906, -0.058925628662109375, -0.05048942565917969, -0.04205322265625, -0.03361701965332031, -0.025180816650390625, -0.016744613647460938, -0.00830841064453125, 0.0001277923583984375, 0.008563995361328125, 0.017000198364257812, 0.0254364013671875, 0.03387260437011719, 0.042308807373046875, 0.05074501037597656, 0.05918121337890625, 0.06761741638183594, 0.07605361938476562, 0.08448982238769531, 0.092926025390625, 0.10136222839355469, 0.10979843139648438, 0.11823463439941406, 0.12667083740234375, 0.13510704040527344, 0.14354324340820312, 0.1519794464111328, 0.1604156494140625, 0.1688518524169922, 0.17728805541992188, 0.18572425842285156, 0.19416046142578125, 0.20259666442871094, 0.21103286743164062, 0.2194690704345703, 0.2279052734375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 1.0, 13.0, 12.0, 17.0, 17.0, 17.0, 26.0, 25.0, 33.0, 40.0, 59.0, 56.0, 58.0, 62.0, 56.0, 61.0, 53.0, 54.0, 57.0, 38.0, 46.0, 32.0, 33.0, 27.0, 14.0, 17.0, 21.0, 9.0, 13.0, 9.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.960873603820801, -6.703713893890381, -6.446554183959961, -6.189394474029541, -5.932234764099121, -5.675075054168701, -5.417915344238281, -5.1607561111450195, -4.903595924377441, -4.6464362144470215, -4.389276504516602, -4.132116794586182, -3.8749570846557617, -3.617797374725342, -3.360637903213501, -3.103478193283081, -2.8463187217712402, -2.5891590118408203, -2.3319993019104004, -2.0748395919799805, -1.81768000125885, -1.5605202913284302, -1.3033607006072998, -1.0462009906768799, -0.78904128074646, -0.53188157081604, -0.2747219204902649, -0.017562270164489746, 0.23959743976593018, 0.4967571496963501, 0.7539167404174805, 1.0110764503479004, 1.2682361602783203, 1.5253958702087402, 1.7825555801391602, 2.03971529006958, 2.296875, 2.55403470993042, 2.8111941814422607, 3.0683538913726807, 3.3255136013031006, 3.5826733112335205, 3.8398330211639404, 4.096992492675781, 4.354152202606201, 4.611311912536621, 4.868471622467041, 5.125631332397461, 5.382791042327881, 5.639950752258301, 5.897110462188721, 6.154270172119141, 6.4114298820495605, 6.6685895919799805, 6.925748825073242, 7.18290901184082, 7.440068244934082, 7.697227954864502, 7.954387664794922, 8.211546897888184, 8.468707084655762, 8.725866317749023, 8.983026504516602, 9.240185737609863, 9.497345924377441]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 8.0, 7.0, 3.0, 6.0, 7.0, 14.0, 5.0, 8.0, 23.0, 14.0, 25.0, 13.0, 23.0, 29.0, 28.0, 23.0, 39.0, 32.0, 26.0, 31.0, 33.0, 34.0, 39.0, 37.0, 29.0, 32.0, 36.0, 33.0, 51.0, 42.0, 24.0, 31.0, 23.0, 26.0, 17.0, 27.0, 24.0, 19.0, 14.0, 11.0, 8.0, 9.0, 5.0, 11.0, 5.0, 2.0, 1.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.849215984344482, -5.673767566680908, -5.498319149017334, -5.32287073135376, -5.147421836853027, -4.971973419189453, -4.796525001525879, -4.621076583862305, -4.4456281661987305, -4.270179748535156, -4.094731330871582, -3.9192826747894287, -3.7438342571258545, -3.5683858394622803, -3.392937183380127, -3.2174887657165527, -3.0420403480529785, -2.8665919303894043, -2.69114351272583, -2.5156948566436768, -2.3402464389801025, -2.1647980213165283, -1.9893494844436646, -1.8139009475708008, -1.6384525299072266, -1.4630041122436523, -1.2875555753707886, -1.1121070384979248, -0.9366586208343506, -0.7612101435661316, -0.5857616662979126, -0.41031312942504883, -0.2348642349243164, -0.05941575765609741, 0.11603271961212158, 0.2914811968803406, 0.46692967414855957, 0.6423781514167786, 0.8178266286849976, 0.9932751655578613, 1.1687235832214355, 1.3441720008850098, 1.5196205377578735, 1.6950690746307373, 1.8705174922943115, 2.0459659099578857, 2.221414566040039, 2.3968629837036133, 2.5723114013671875, 2.7477598190307617, 2.923208236694336, 3.0986568927764893, 3.2741053104400635, 3.4495537281036377, 3.625002384185791, 3.8004508018493652, 3.9758992195129395, 4.151347637176514, 4.326796054840088, 4.502244472503662, 4.6776933670043945, 4.853141784667969, 5.028590202331543, 5.204038619995117, 5.379487037658691]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 18.0, 24.0, 38.0, 65.0, 95.0, 152.0, 238.0, 395.0, 653.0, 1041.0, 1637.0, 2653.0, 4381.0, 6946.0, 11364.0, 18929.0, 30604.0, 49191.0, 75148.0, 107365.0, 136815.0, 149610.0, 137244.0, 107941.0, 75957.0, 49549.0, 31269.0, 19216.0, 11409.0, 7025.0, 4450.0, 2689.0, 1678.0, 1010.0, 657.0, 386.0, 267.0, 145.0, 108.0, 70.0, 39.0, 27.0, 15.0, 18.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.79296875, -5.609130859375, -5.42529296875, -5.241455078125, -5.0576171875, -4.873779296875, -4.68994140625, -4.506103515625, -4.322265625, -4.138427734375, -3.95458984375, -3.770751953125, -3.5869140625, -3.403076171875, -3.21923828125, -3.035400390625, -2.8515625, -2.667724609375, -2.48388671875, -2.300048828125, -2.1162109375, -1.932373046875, -1.74853515625, -1.564697265625, -1.380859375, -1.197021484375, -1.01318359375, -0.829345703125, -0.6455078125, -0.461669921875, -0.27783203125, -0.093994140625, 0.08984375, 0.273681640625, 0.45751953125, 0.641357421875, 0.8251953125, 1.009033203125, 1.19287109375, 1.376708984375, 1.560546875, 1.744384765625, 1.92822265625, 2.112060546875, 2.2958984375, 2.479736328125, 2.66357421875, 2.847412109375, 3.03125, 3.215087890625, 3.39892578125, 3.582763671875, 3.7666015625, 3.950439453125, 4.13427734375, 4.318115234375, 4.501953125, 4.685791015625, 4.86962890625, 5.053466796875, 5.2373046875, 5.421142578125, 5.60498046875, 5.788818359375, 5.97265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 6.0, 4.0, 6.0, 11.0, 8.0, 8.0, 14.0, 10.0, 21.0, 23.0, 11.0, 14.0, 23.0, 24.0, 30.0, 27.0, 32.0, 23.0, 32.0, 39.0, 32.0, 38.0, 46.0, 35.0, 31.0, 55.0, 38.0, 38.0, 33.0, 33.0, 25.0, 38.0, 20.0, 14.0, 17.0, 19.0, 17.0, 24.0, 12.0, 10.0, 15.0, 10.0, 3.0, 6.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-5.86328125, -5.69061279296875, -5.5179443359375, -5.34527587890625, -5.172607421875, -4.99993896484375, -4.8272705078125, -4.65460205078125, -4.48193359375, -4.30926513671875, -4.1365966796875, -3.96392822265625, -3.791259765625, -3.61859130859375, -3.4459228515625, -3.27325439453125, -3.1005859375, -2.92791748046875, -2.7552490234375, -2.58258056640625, -2.409912109375, -2.23724365234375, -2.0645751953125, -1.89190673828125, -1.71923828125, -1.54656982421875, -1.3739013671875, -1.20123291015625, -1.028564453125, -0.85589599609375, -0.6832275390625, -0.51055908203125, -0.337890625, -0.16522216796875, 0.0074462890625, 0.18011474609375, 0.352783203125, 0.52545166015625, 0.6981201171875, 0.87078857421875, 1.04345703125, 1.21612548828125, 1.3887939453125, 1.56146240234375, 1.734130859375, 1.90679931640625, 2.0794677734375, 2.25213623046875, 2.4248046875, 2.59747314453125, 2.7701416015625, 2.94281005859375, 3.115478515625, 3.28814697265625, 3.4608154296875, 3.63348388671875, 3.80615234375, 3.97882080078125, 4.1514892578125, 4.32415771484375, 4.496826171875, 4.66949462890625, 4.8421630859375, 5.01483154296875, 5.1875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 7.0, 6.0, 15.0, 17.0, 31.0, 46.0, 70.0, 114.0, 182.0, 248.0, 363.0, 590.0, 985.0, 1471.0, 2215.0, 3528.0, 5497.0, 8714.0, 13520.0, 21144.0, 32937.0, 49381.0, 71936.0, 98746.0, 123992.0, 136211.0, 129247.0, 106980.0, 79856.0, 55633.0, 37338.0, 24236.0, 15870.0, 9981.0, 6197.0, 4060.0, 2563.0, 1601.0, 1049.0, 648.0, 466.0, 265.0, 184.0, 130.0, 95.0, 58.0, 49.0, 23.0, 20.0, 13.0, 8.0, 4.0, 5.0, 5.0, 1.0, 4.0], "bins": [-6.84375, -6.640380859375, -6.43701171875, -6.233642578125, -6.0302734375, -5.826904296875, -5.62353515625, -5.420166015625, -5.216796875, -5.013427734375, -4.81005859375, -4.606689453125, -4.4033203125, -4.199951171875, -3.99658203125, -3.793212890625, -3.58984375, -3.386474609375, -3.18310546875, -2.979736328125, -2.7763671875, -2.572998046875, -2.36962890625, -2.166259765625, -1.962890625, -1.759521484375, -1.55615234375, -1.352783203125, -1.1494140625, -0.946044921875, -0.74267578125, -0.539306640625, -0.3359375, -0.132568359375, 0.07080078125, 0.274169921875, 0.4775390625, 0.680908203125, 0.88427734375, 1.087646484375, 1.291015625, 1.494384765625, 1.69775390625, 1.901123046875, 2.1044921875, 2.307861328125, 2.51123046875, 2.714599609375, 2.91796875, 3.121337890625, 3.32470703125, 3.528076171875, 3.7314453125, 3.934814453125, 4.13818359375, 4.341552734375, 4.544921875, 4.748291015625, 4.95166015625, 5.155029296875, 5.3583984375, 5.561767578125, 5.76513671875, 5.968505859375, 6.171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 2.0, 6.0, 2.0, 10.0, 12.0, 15.0, 16.0, 13.0, 18.0, 24.0, 25.0, 29.0, 32.0, 33.0, 27.0, 22.0, 34.0, 47.0, 43.0, 52.0, 42.0, 37.0, 36.0, 35.0, 43.0, 34.0, 38.0, 42.0, 28.0, 25.0, 19.0, 21.0, 17.0, 13.0, 24.0, 12.0, 7.0, 11.0, 10.0, 14.0, 6.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.990234375, -3.870452880859375, -3.75067138671875, -3.630889892578125, -3.5111083984375, -3.391326904296875, -3.27154541015625, -3.151763916015625, -3.031982421875, -2.912200927734375, -2.79241943359375, -2.672637939453125, -2.5528564453125, -2.433074951171875, -2.31329345703125, -2.193511962890625, -2.07373046875, -1.953948974609375, -1.83416748046875, -1.714385986328125, -1.5946044921875, -1.474822998046875, -1.35504150390625, -1.235260009765625, -1.115478515625, -0.995697021484375, -0.87591552734375, -0.756134033203125, -0.6363525390625, -0.516571044921875, -0.39678955078125, -0.277008056640625, -0.1572265625, -0.037445068359375, 0.08233642578125, 0.202117919921875, 0.3218994140625, 0.441680908203125, 0.56146240234375, 0.681243896484375, 0.801025390625, 0.920806884765625, 1.04058837890625, 1.160369873046875, 1.2801513671875, 1.399932861328125, 1.51971435546875, 1.639495849609375, 1.75927734375, 1.879058837890625, 1.99884033203125, 2.118621826171875, 2.2384033203125, 2.358184814453125, 2.47796630859375, 2.597747802734375, 2.717529296875, 2.837310791015625, 2.95709228515625, 3.076873779296875, 3.1966552734375, 3.316436767578125, 3.43621826171875, 3.555999755859375, 3.67578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 6.0, 12.0, 12.0, 12.0, 17.0, 24.0, 31.0, 43.0, 57.0, 64.0, 98.0, 125.0, 164.0, 217.0, 289.0, 414.0, 656.0, 964.0, 1597.0, 2904.0, 5511.0, 11668.0, 29765.0, 98374.0, 366067.0, 372232.0, 101457.0, 30530.0, 11892.0, 5490.0, 2856.0, 1633.0, 1044.0, 654.0, 466.0, 339.0, 222.0, 172.0, 121.0, 93.0, 68.0, 46.0, 39.0, 29.0, 21.0, 15.0, 12.0, 7.0, 6.0, 4.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.7109375, -11.3450927734375, -10.979248046875, -10.6134033203125, -10.24755859375, -9.8817138671875, -9.515869140625, -9.1500244140625, -8.7841796875, -8.4183349609375, -8.052490234375, -7.6866455078125, -7.32080078125, -6.9549560546875, -6.589111328125, -6.2232666015625, -5.857421875, -5.4915771484375, -5.125732421875, -4.7598876953125, -4.39404296875, -4.0281982421875, -3.662353515625, -3.2965087890625, -2.9306640625, -2.5648193359375, -2.198974609375, -1.8331298828125, -1.46728515625, -1.1014404296875, -0.735595703125, -0.3697509765625, -0.00390625, 0.3619384765625, 0.727783203125, 1.0936279296875, 1.45947265625, 1.8253173828125, 2.191162109375, 2.5570068359375, 2.9228515625, 3.2886962890625, 3.654541015625, 4.0203857421875, 4.38623046875, 4.7520751953125, 5.117919921875, 5.4837646484375, 5.849609375, 6.2154541015625, 6.581298828125, 6.9471435546875, 7.31298828125, 7.6788330078125, 8.044677734375, 8.4105224609375, 8.7763671875, 9.1422119140625, 9.508056640625, 9.8739013671875, 10.23974609375, 10.6055908203125, 10.971435546875, 11.3372802734375, 11.703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 8.0, 4.0, 5.0, 12.0, 16.0, 19.0, 23.0, 40.0, 45.0, 76.0, 91.0, 83.0, 102.0, 97.0, 76.0, 59.0, 52.0, 43.0, 35.0, 24.0, 27.0, 12.0, 9.0, 6.0, 5.0, 9.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005993843078613281, -0.0005777403712272644, -0.0005560964345932007, -0.000534452497959137, -0.0005128085613250732, -0.0004911646246910095, -0.0004695206880569458, -0.0004478767514228821, -0.00042623281478881836, -0.00040458887815475464, -0.0003829449415206909, -0.0003613010048866272, -0.0003396570682525635, -0.00031801313161849976, -0.00029636919498443604, -0.0002747252583503723, -0.0002530813217163086, -0.00023143738508224487, -0.00020979344844818115, -0.00018814951181411743, -0.0001665055751800537, -0.00014486163854599, -0.00012321770191192627, -0.00010157376527786255, -7.992982864379883e-05, -5.828589200973511e-05, -3.664195537567139e-05, -1.4998018741607666e-05, 6.645917892456055e-06, 2.8289854526519775e-05, 4.9933791160583496e-05, 7.157772779464722e-05, 9.322166442871094e-05, 0.00011486560106277466, 0.00013650953769683838, 0.0001581534743309021, 0.00017979741096496582, 0.00020144134759902954, 0.00022308528423309326, 0.000244729220867157, 0.0002663731575012207, 0.0002880170941352844, 0.00030966103076934814, 0.00033130496740341187, 0.0003529489040374756, 0.0003745928406715393, 0.00039623677730560303, 0.00041788071393966675, 0.00043952465057373047, 0.0004611685872077942, 0.0004828125238418579, 0.0005044564604759216, 0.0005261003971099854, 0.0005477443337440491, 0.0005693882703781128, 0.0005910322070121765, 0.0006126761436462402, 0.000634320080280304, 0.0006559640169143677, 0.0006776079535484314, 0.0006992518901824951, 0.0007208958268165588, 0.0007425397634506226, 0.0007641837000846863, 0.00078582763671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 11.0, 15.0, 15.0, 24.0, 17.0, 24.0, 42.0, 58.0, 62.0, 75.0, 122.0, 162.0, 218.0, 357.0, 497.0, 737.0, 1099.0, 1918.0, 3400.0, 6801.0, 15262.0, 40953.0, 133510.0, 373055.0, 312120.0, 100118.0, 31718.0, 12663.0, 5619.0, 2958.0, 1671.0, 1027.0, 672.0, 430.0, 286.0, 209.0, 152.0, 110.0, 94.0, 63.0, 46.0, 38.0, 25.0, 28.0, 20.0, 10.0, 8.0, 10.0, 4.0, 4.0, 6.0, 2.0, 4.0, 1.0, 4.0], "bins": [-9.765625, -9.4686279296875, -9.171630859375, -8.8746337890625, -8.57763671875, -8.2806396484375, -7.983642578125, -7.6866455078125, -7.3896484375, -7.0926513671875, -6.795654296875, -6.4986572265625, -6.20166015625, -5.9046630859375, -5.607666015625, -5.3106689453125, -5.013671875, -4.7166748046875, -4.419677734375, -4.1226806640625, -3.82568359375, -3.5286865234375, -3.231689453125, -2.9346923828125, -2.6376953125, -2.3406982421875, -2.043701171875, -1.7467041015625, -1.44970703125, -1.1527099609375, -0.855712890625, -0.5587158203125, -0.26171875, 0.0352783203125, 0.332275390625, 0.6292724609375, 0.92626953125, 1.2232666015625, 1.520263671875, 1.8172607421875, 2.1142578125, 2.4112548828125, 2.708251953125, 3.0052490234375, 3.30224609375, 3.5992431640625, 3.896240234375, 4.1932373046875, 4.490234375, 4.7872314453125, 5.084228515625, 5.3812255859375, 5.67822265625, 5.9752197265625, 6.272216796875, 6.5692138671875, 6.8662109375, 7.1632080078125, 7.460205078125, 7.7572021484375, 8.05419921875, 8.3511962890625, 8.648193359375, 8.9451904296875, 9.2421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 17.0, 19.0, 29.0, 40.0, 67.0, 95.0, 102.0, 118.0, 89.0, 101.0, 87.0, 55.0, 55.0, 44.0, 26.0, 6.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.317138671875, -3.21435546875, -3.111572265625, -3.0087890625, -2.906005859375, -2.80322265625, -2.700439453125, -2.59765625, -2.494873046875, -2.39208984375, -2.289306640625, -2.1865234375, -2.083740234375, -1.98095703125, -1.878173828125, -1.775390625, -1.672607421875, -1.56982421875, -1.467041015625, -1.3642578125, -1.261474609375, -1.15869140625, -1.055908203125, -0.953125, -0.850341796875, -0.74755859375, -0.644775390625, -0.5419921875, -0.439208984375, -0.33642578125, -0.233642578125, -0.130859375, -0.028076171875, 0.07470703125, 0.177490234375, 0.2802734375, 0.383056640625, 0.48583984375, 0.588623046875, 0.69140625, 0.794189453125, 0.89697265625, 0.999755859375, 1.1025390625, 1.205322265625, 1.30810546875, 1.410888671875, 1.513671875, 1.616455078125, 1.71923828125, 1.822021484375, 1.9248046875, 2.027587890625, 2.13037109375, 2.233154296875, 2.3359375, 2.438720703125, 2.54150390625, 2.644287109375, 2.7470703125, 2.849853515625, 2.95263671875, 3.055419921875, 3.158203125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 10.0, 7.0, 10.0, 15.0, 11.0, 21.0, 18.0, 27.0, 36.0, 48.0, 49.0, 56.0, 61.0, 63.0, 46.0, 49.0, 61.0, 45.0, 58.0, 36.0, 37.0, 30.0, 37.0, 29.0, 21.0, 20.0, 22.0, 14.0, 10.0, 8.0, 8.0, 10.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-7.927132606506348, -7.689866065979004, -7.452600002288818, -7.215333461761475, -6.978066921234131, -6.740800857543945, -6.503534317016602, -6.266267776489258, -6.029001235961914, -5.79173469543457, -5.554468631744385, -5.317202091217041, -5.079935550689697, -4.842669486999512, -4.605402946472168, -4.368136405944824, -4.1308698654174805, -3.893603563308716, -3.656337022781372, -3.4190707206726074, -3.1818041801452637, -2.944537878036499, -2.7072715759277344, -2.4700050354003906, -2.232738971710205, -1.9954725503921509, -1.7582061290740967, -1.520939826965332, -1.2836732864379883, -1.0464069843292236, -0.8091405630111694, -0.5718741416931152, -0.3346076011657715, -0.09734119474887848, 0.13992521166801453, 0.37719160318374634, 0.6144580245018005, 0.85172438621521, 1.0889908075332642, 1.3262572288513184, 1.5635236501693726, 1.8007900714874268, 2.0380563735961914, 2.275322914123535, 2.5125892162323, 2.7498555183410645, 2.987122058868408, 3.224388599395752, 3.4616549015045166, 3.6989212036132812, 3.936187744140625, 4.173454284667969, 4.410720348358154, 4.647986888885498, 4.885253429412842, 5.122519493103027, 5.359786033630371, 5.597052574157715, 5.8343186378479, 6.071585178375244, 6.308851718902588, 6.546117782592773, 6.783384323120117, 7.020650863647461, 7.257917404174805]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 7.0, 2.0, 1.0, 4.0, 6.0, 7.0, 9.0, 14.0, 16.0, 15.0, 15.0, 18.0, 21.0, 15.0, 31.0, 21.0, 23.0, 42.0, 42.0, 32.0, 37.0, 37.0, 36.0, 43.0, 36.0, 42.0, 46.0, 37.0, 40.0, 26.0, 29.0, 30.0, 34.0, 19.0, 15.0, 23.0, 21.0, 26.0, 18.0, 10.0, 15.0, 9.0, 4.0, 5.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-6.335994720458984, -6.1490349769592285, -5.962075710296631, -5.775115966796875, -5.588156700134277, -5.4011969566345215, -5.214237213134766, -5.027277946472168, -4.840318202972412, -4.653358459472656, -4.466399192810059, -4.279439449310303, -4.092479705810547, -3.905520439147949, -3.7185606956481934, -3.5316011905670166, -3.34464168548584, -3.157682180404663, -2.9707226753234863, -2.7837629318237305, -2.5968034267425537, -2.409843921661377, -2.222884178161621, -2.0359246730804443, -1.8489651679992676, -1.6620056629180908, -1.4750460386276245, -1.2880864143371582, -1.1011269092559814, -0.9141673445701599, -0.7272077798843384, -0.5402481555938721, -0.3532891273498535, -0.16632956266403198, 0.02063000202178955, 0.20758956670761108, 0.3945491313934326, 0.5815086960792542, 0.7684682607650757, 0.955427885055542, 1.1423873901367188, 1.3293468952178955, 1.5163065195083618, 1.7032661437988281, 1.8902256488800049, 2.0771851539611816, 2.2641448974609375, 2.4511044025421143, 2.638063907623291, 2.8250234127044678, 3.0119829177856445, 3.1989426612854004, 3.385902166366577, 3.572861671447754, 3.7598214149475098, 3.9467809200286865, 4.133740425109863, 4.320700168609619, 4.507659435272217, 4.694619178771973, 4.88157844543457, 5.068538188934326, 5.255497932434082, 5.44245719909668, 5.6294169425964355]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 12.0, 18.0, 29.0, 36.0, 68.0, 88.0, 113.0, 169.0, 230.0, 348.0, 498.0, 748.0, 1147.0, 1635.0, 2678.0, 4162.0, 6902.0, 11587.0, 20572.0, 37771.0, 71804.0, 142179.0, 284993.0, 526598.0, 790143.0, 854713.0, 651836.0, 377189.0, 191198.0, 95952.0, 50262.0, 27498.0, 15557.0, 9176.0, 5621.0, 3551.0, 2355.0, 1526.0, 1024.0, 743.0, 491.0, 348.0, 247.0, 144.0, 110.0, 71.0, 50.0, 32.0, 19.0, 8.0, 13.0, 5.0, 6.0, 6.0], "bins": [-6.78125, -6.5887451171875, -6.396240234375, -6.2037353515625, -6.01123046875, -5.8187255859375, -5.626220703125, -5.4337158203125, -5.2412109375, -5.0487060546875, -4.856201171875, -4.6636962890625, -4.47119140625, -4.2786865234375, -4.086181640625, -3.8936767578125, -3.701171875, -3.5086669921875, -3.316162109375, -3.1236572265625, -2.93115234375, -2.7386474609375, -2.546142578125, -2.3536376953125, -2.1611328125, -1.9686279296875, -1.776123046875, -1.5836181640625, -1.39111328125, -1.1986083984375, -1.006103515625, -0.8135986328125, -0.62109375, -0.4285888671875, -0.236083984375, -0.0435791015625, 0.14892578125, 0.3414306640625, 0.533935546875, 0.7264404296875, 0.9189453125, 1.1114501953125, 1.303955078125, 1.4964599609375, 1.68896484375, 1.8814697265625, 2.073974609375, 2.2664794921875, 2.458984375, 2.6514892578125, 2.843994140625, 3.0364990234375, 3.22900390625, 3.4215087890625, 3.614013671875, 3.8065185546875, 3.9990234375, 4.1915283203125, 4.384033203125, 4.5765380859375, 4.76904296875, 4.9615478515625, 5.154052734375, 5.3465576171875, 5.5390625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 10.0, 11.0, 15.0, 8.0, 18.0, 13.0, 19.0, 18.0, 26.0, 22.0, 33.0, 32.0, 31.0, 33.0, 30.0, 49.0, 39.0, 27.0, 41.0, 47.0, 44.0, 47.0, 45.0, 38.0, 39.0, 32.0, 22.0, 22.0, 29.0, 20.0, 24.0, 14.0, 7.0, 13.0, 16.0, 8.0, 11.0, 4.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.58984375, -5.4237060546875, -5.257568359375, -5.0914306640625, -4.92529296875, -4.7591552734375, -4.593017578125, -4.4268798828125, -4.2607421875, -4.0946044921875, -3.928466796875, -3.7623291015625, -3.59619140625, -3.4300537109375, -3.263916015625, -3.0977783203125, -2.931640625, -2.7655029296875, -2.599365234375, -2.4332275390625, -2.26708984375, -2.1009521484375, -1.934814453125, -1.7686767578125, -1.6025390625, -1.4364013671875, -1.270263671875, -1.1041259765625, -0.93798828125, -0.7718505859375, -0.605712890625, -0.4395751953125, -0.2734375, -0.1072998046875, 0.058837890625, 0.2249755859375, 0.39111328125, 0.5572509765625, 0.723388671875, 0.8895263671875, 1.0556640625, 1.2218017578125, 1.387939453125, 1.5540771484375, 1.72021484375, 1.8863525390625, 2.052490234375, 2.2186279296875, 2.384765625, 2.5509033203125, 2.717041015625, 2.8831787109375, 3.04931640625, 3.2154541015625, 3.381591796875, 3.5477294921875, 3.7138671875, 3.8800048828125, 4.046142578125, 4.2122802734375, 4.37841796875, 4.5445556640625, 4.710693359375, 4.8768310546875, 5.04296875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 8.0, 16.0, 27.0, 39.0, 44.0, 69.0, 91.0, 126.0, 187.0, 269.0, 415.0, 669.0, 1073.0, 1577.0, 2512.0, 3938.0, 6375.0, 10698.0, 17882.0, 30457.0, 52551.0, 92962.0, 163372.0, 280831.0, 458692.0, 659545.0, 746639.0, 627490.0, 425561.0, 257988.0, 148962.0, 84381.0, 48394.0, 27949.0, 16691.0, 9734.0, 5832.0, 3621.0, 2320.0, 1529.0, 951.0, 653.0, 384.0, 276.0, 175.0, 111.0, 70.0, 42.0, 34.0, 20.0, 19.0, 15.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0], "bins": [-6.515625, -6.31463623046875, -6.1136474609375, -5.91265869140625, -5.711669921875, -5.51068115234375, -5.3096923828125, -5.10870361328125, -4.90771484375, -4.70672607421875, -4.5057373046875, -4.30474853515625, -4.103759765625, -3.90277099609375, -3.7017822265625, -3.50079345703125, -3.2998046875, -3.09881591796875, -2.8978271484375, -2.69683837890625, -2.495849609375, -2.29486083984375, -2.0938720703125, -1.89288330078125, -1.69189453125, -1.49090576171875, -1.2899169921875, -1.08892822265625, -0.887939453125, -0.68695068359375, -0.4859619140625, -0.28497314453125, -0.083984375, 0.11700439453125, 0.3179931640625, 0.51898193359375, 0.719970703125, 0.92095947265625, 1.1219482421875, 1.32293701171875, 1.52392578125, 1.72491455078125, 1.9259033203125, 2.12689208984375, 2.327880859375, 2.52886962890625, 2.7298583984375, 2.93084716796875, 3.1318359375, 3.33282470703125, 3.5338134765625, 3.73480224609375, 3.935791015625, 4.13677978515625, 4.3377685546875, 4.53875732421875, 4.73974609375, 4.94073486328125, 5.1417236328125, 5.34271240234375, 5.543701171875, 5.74468994140625, 5.9456787109375, 6.14666748046875, 6.34765625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 5.0, 15.0, 17.0, 25.0, 29.0, 33.0, 41.0, 37.0, 60.0, 53.0, 80.0, 96.0, 138.0, 129.0, 166.0, 198.0, 199.0, 210.0, 221.0, 240.0, 266.0, 249.0, 225.0, 234.0, 169.0, 167.0, 143.0, 124.0, 89.0, 92.0, 78.0, 45.0, 47.0, 19.0, 27.0, 20.0, 20.0, 14.0, 14.0, 8.0, 8.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.791015625, -2.713531494140625, -2.63604736328125, -2.558563232421875, -2.4810791015625, -2.403594970703125, -2.32611083984375, -2.248626708984375, -2.171142578125, -2.093658447265625, -2.01617431640625, -1.938690185546875, -1.8612060546875, -1.783721923828125, -1.70623779296875, -1.628753662109375, -1.55126953125, -1.473785400390625, -1.39630126953125, -1.318817138671875, -1.2413330078125, -1.163848876953125, -1.08636474609375, -1.008880615234375, -0.931396484375, -0.853912353515625, -0.77642822265625, -0.698944091796875, -0.6214599609375, -0.543975830078125, -0.46649169921875, -0.389007568359375, -0.3115234375, -0.234039306640625, -0.15655517578125, -0.079071044921875, -0.0015869140625, 0.075897216796875, 0.15338134765625, 0.230865478515625, 0.308349609375, 0.385833740234375, 0.46331787109375, 0.540802001953125, 0.6182861328125, 0.695770263671875, 0.77325439453125, 0.850738525390625, 0.92822265625, 1.005706787109375, 1.08319091796875, 1.160675048828125, 1.2381591796875, 1.315643310546875, 1.39312744140625, 1.470611572265625, 1.548095703125, 1.625579833984375, 1.70306396484375, 1.780548095703125, 1.8580322265625, 1.935516357421875, 2.01300048828125, 2.090484619140625, 2.16796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 5.0, 4.0, 12.0, 8.0, 17.0, 11.0, 21.0, 20.0, 27.0, 21.0, 24.0, 36.0, 38.0, 48.0, 47.0, 38.0, 40.0, 55.0, 56.0, 44.0, 36.0, 50.0, 38.0, 44.0, 43.0, 32.0, 25.0, 28.0, 20.0, 19.0, 19.0, 12.0, 9.0, 9.0, 10.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.262025356292725, -6.049343585968018, -5.836662292480469, -5.623980522155762, -5.411298751831055, -5.198617458343506, -4.985935688018799, -4.77325439453125, -4.560572624206543, -4.347890853881836, -4.135209560394287, -3.92252779006958, -3.709846258163452, -3.497164726257324, -3.284482955932617, -3.0718014240264893, -2.8591196537017822, -2.6464381217956543, -2.4337563514709473, -2.2210748195648193, -2.0083932876586914, -1.795711636543274, -1.5830299854278564, -1.3703484535217285, -1.157666802406311, -0.9449852108955383, -0.7323036193847656, -0.5196219682693481, -0.30694037675857544, -0.09425878524780273, 0.11842286586761475, 0.3311043977737427, 0.5437860488891602, 0.7564676403999329, 0.9691492319107056, 1.181830883026123, 1.394512414932251, 1.6071940660476685, 1.819875717163086, 2.032557249069214, 2.245238780975342, 2.4579203128814697, 2.6706020832061768, 2.8832836151123047, 3.0959651470184326, 3.3086466789245605, 3.5213284492492676, 3.7340099811553955, 3.9466917514801025, 4.1593732833862305, 4.3720550537109375, 4.5847368240356445, 4.797418117523193, 5.0100998878479, 5.222781181335449, 5.435462951660156, 5.648144721984863, 5.86082649230957, 6.073507785797119, 6.286189556121826, 6.498871326446533, 6.711552619934082, 6.924234390258789, 7.136916160583496, 7.349597454071045]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 10.0, 2.0, 9.0, 11.0, 11.0, 14.0, 10.0, 10.0, 23.0, 16.0, 23.0, 27.0, 27.0, 25.0, 37.0, 38.0, 41.0, 43.0, 49.0, 46.0, 49.0, 35.0, 44.0, 33.0, 41.0, 41.0, 32.0, 22.0, 34.0, 28.0, 27.0, 18.0, 20.0, 16.0, 21.0, 13.0, 9.0, 11.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0], "bins": [-6.842390060424805, -6.6507062911987305, -6.459022045135498, -6.267338275909424, -6.075654029846191, -5.883970260620117, -5.692286491394043, -5.500602722167969, -5.308918476104736, -5.117234706878662, -4.92555046081543, -4.7338666915893555, -4.542182922363281, -4.350498676300049, -4.158814907073975, -3.9671308994293213, -3.775446891784668, -3.5837628841400146, -3.3920788764953613, -3.200395107269287, -3.008711099624634, -2.8170270919799805, -2.6253433227539062, -2.433659315109253, -2.2419753074645996, -2.0502912998199463, -1.8586074113845825, -1.6669235229492188, -1.4752395153045654, -1.283555507659912, -1.0918716192245483, -0.9001877307891846, -0.7085037231445312, -0.5168197751045227, -0.32513582706451416, -0.13345187902450562, 0.05823206901550293, 0.24991601705551147, 0.44159996509552, 0.6332838535308838, 0.8249678611755371, 1.0166518688201904, 1.2083357572555542, 1.400019645690918, 1.5917036533355713, 1.7833876609802246, 1.9750715494155884, 2.166755437850952, 2.3584394454956055, 2.550123453140259, 2.741807460784912, 2.9334912300109863, 3.1251752376556396, 3.316859245300293, 3.508543014526367, 3.7002270221710205, 3.891911029815674, 4.083594799041748, 4.2752790451049805, 4.466962814331055, 4.658646583557129, 4.850330829620361, 5.0420145988464355, 5.233698844909668, 5.425382614135742]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 9.0, 13.0, 30.0, 29.0, 41.0, 64.0, 111.0, 163.0, 240.0, 401.0, 657.0, 1101.0, 1876.0, 3253.0, 5724.0, 9906.0, 18040.0, 33226.0, 62570.0, 117048.0, 191714.0, 224887.0, 167495.0, 96439.0, 51478.0, 27256.0, 14773.0, 8374.0, 4716.0, 2776.0, 1615.0, 952.0, 618.0, 341.0, 241.0, 133.0, 80.0, 54.0, 27.0, 27.0, 19.0, 11.0, 8.0, 2.0, 8.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.47265625, -5.31329345703125, -5.1539306640625, -4.99456787109375, -4.835205078125, -4.67584228515625, -4.5164794921875, -4.35711669921875, -4.19775390625, -4.03839111328125, -3.8790283203125, -3.71966552734375, -3.560302734375, -3.40093994140625, -3.2415771484375, -3.08221435546875, -2.9228515625, -2.76348876953125, -2.6041259765625, -2.44476318359375, -2.285400390625, -2.12603759765625, -1.9666748046875, -1.80731201171875, -1.64794921875, -1.48858642578125, -1.3292236328125, -1.16986083984375, -1.010498046875, -0.85113525390625, -0.6917724609375, -0.53240966796875, -0.373046875, -0.21368408203125, -0.0543212890625, 0.10504150390625, 0.264404296875, 0.42376708984375, 0.5831298828125, 0.74249267578125, 0.90185546875, 1.06121826171875, 1.2205810546875, 1.37994384765625, 1.539306640625, 1.69866943359375, 1.8580322265625, 2.01739501953125, 2.1767578125, 2.33612060546875, 2.4954833984375, 2.65484619140625, 2.814208984375, 2.97357177734375, 3.1329345703125, 3.29229736328125, 3.45166015625, 3.61102294921875, 3.7703857421875, 3.92974853515625, 4.089111328125, 4.24847412109375, 4.4078369140625, 4.56719970703125, 4.7265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 1.0, 6.0, 6.0, 13.0, 5.0, 14.0, 11.0, 17.0, 13.0, 17.0, 27.0, 28.0, 24.0, 26.0, 34.0, 36.0, 36.0, 44.0, 39.0, 49.0, 55.0, 39.0, 44.0, 41.0, 36.0, 36.0, 40.0, 36.0, 33.0, 25.0, 35.0, 14.0, 22.0, 24.0, 19.0, 12.0, 7.0, 10.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.5, -7.2926025390625, -7.085205078125, -6.8778076171875, -6.67041015625, -6.4630126953125, -6.255615234375, -6.0482177734375, -5.8408203125, -5.6334228515625, -5.426025390625, -5.2186279296875, -5.01123046875, -4.8038330078125, -4.596435546875, -4.3890380859375, -4.181640625, -3.9742431640625, -3.766845703125, -3.5594482421875, -3.35205078125, -3.1446533203125, -2.937255859375, -2.7298583984375, -2.5224609375, -2.3150634765625, -2.107666015625, -1.9002685546875, -1.69287109375, -1.4854736328125, -1.278076171875, -1.0706787109375, -0.86328125, -0.6558837890625, -0.448486328125, -0.2410888671875, -0.03369140625, 0.1737060546875, 0.381103515625, 0.5885009765625, 0.7958984375, 1.0032958984375, 1.210693359375, 1.4180908203125, 1.62548828125, 1.8328857421875, 2.040283203125, 2.2476806640625, 2.455078125, 2.6624755859375, 2.869873046875, 3.0772705078125, 3.28466796875, 3.4920654296875, 3.699462890625, 3.9068603515625, 4.1142578125, 4.3216552734375, 4.529052734375, 4.7364501953125, 4.94384765625, 5.1512451171875, 5.358642578125, 5.5660400390625, 5.7734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 16.0, 10.0, 8.0, 24.0, 23.0, 46.0, 53.0, 90.0, 115.0, 182.0, 275.0, 407.0, 673.0, 1108.0, 1816.0, 3203.0, 5752.0, 10803.0, 21491.0, 66636.0, 803441.0, 83245.0, 23375.0, 11469.0, 5977.0, 3317.0, 1928.0, 1123.0, 680.0, 433.0, 268.0, 173.0, 109.0, 79.0, 49.0, 40.0, 25.0, 15.0, 14.0, 11.0, 10.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.2125244140625, -9.878173828125, -9.5438232421875, -9.20947265625, -8.8751220703125, -8.540771484375, -8.2064208984375, -7.8720703125, -7.5377197265625, -7.203369140625, -6.8690185546875, -6.53466796875, -6.2003173828125, -5.865966796875, -5.5316162109375, -5.197265625, -4.8629150390625, -4.528564453125, -4.1942138671875, -3.85986328125, -3.5255126953125, -3.191162109375, -2.8568115234375, -2.5224609375, -2.1881103515625, -1.853759765625, -1.5194091796875, -1.18505859375, -0.8507080078125, -0.516357421875, -0.1820068359375, 0.15234375, 0.4866943359375, 0.821044921875, 1.1553955078125, 1.48974609375, 1.8240966796875, 2.158447265625, 2.4927978515625, 2.8271484375, 3.1614990234375, 3.495849609375, 3.8302001953125, 4.16455078125, 4.4989013671875, 4.833251953125, 5.1676025390625, 5.501953125, 5.8363037109375, 6.170654296875, 6.5050048828125, 6.83935546875, 7.1737060546875, 7.508056640625, 7.8424072265625, 8.1767578125, 8.5111083984375, 8.845458984375, 9.1798095703125, 9.51416015625, 9.8485107421875, 10.182861328125, 10.5172119140625, 10.8515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 1.0, 3.0, 8.0, 7.0, 8.0, 15.0, 9.0, 12.0, 11.0, 17.0, 23.0, 24.0, 25.0, 27.0, 29.0, 30.0, 33.0, 38.0, 37.0, 53.0, 45.0, 39.0, 51.0, 57.0, 39.0, 42.0, 37.0, 36.0, 29.0, 32.0, 24.0, 19.0, 21.0, 23.0, 15.0, 12.0, 14.0, 12.0, 7.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-5.72265625, -5.54510498046875, -5.3675537109375, -5.19000244140625, -5.012451171875, -4.83489990234375, -4.6573486328125, -4.47979736328125, -4.30224609375, -4.12469482421875, -3.9471435546875, -3.76959228515625, -3.592041015625, -3.41448974609375, -3.2369384765625, -3.05938720703125, -2.8818359375, -2.70428466796875, -2.5267333984375, -2.34918212890625, -2.171630859375, -1.99407958984375, -1.8165283203125, -1.63897705078125, -1.46142578125, -1.28387451171875, -1.1063232421875, -0.92877197265625, -0.751220703125, -0.57366943359375, -0.3961181640625, -0.21856689453125, -0.041015625, 0.13653564453125, 0.3140869140625, 0.49163818359375, 0.669189453125, 0.84674072265625, 1.0242919921875, 1.20184326171875, 1.37939453125, 1.55694580078125, 1.7344970703125, 1.91204833984375, 2.089599609375, 2.26715087890625, 2.4447021484375, 2.62225341796875, 2.7998046875, 2.97735595703125, 3.1549072265625, 3.33245849609375, 3.510009765625, 3.68756103515625, 3.8651123046875, 4.04266357421875, 4.22021484375, 4.39776611328125, 4.5753173828125, 4.75286865234375, 4.930419921875, 5.10797119140625, 5.2855224609375, 5.46307373046875, 5.640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 13.0, 5.0, 20.0, 18.0, 28.0, 27.0, 29.0, 76.0, 89.0, 142.0, 178.0, 278.0, 446.0, 795.0, 1296.0, 2618.0, 5167.0, 11604.0, 34558.0, 653391.0, 290344.0, 27247.0, 10059.0, 4683.0, 2214.0, 1251.0, 738.0, 410.0, 266.0, 181.0, 128.0, 78.0, 48.0, 40.0, 27.0, 18.0, 15.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.446258544921875, -2.36712646484375, -2.287994384765625, -2.2088623046875, -2.129730224609375, -2.05059814453125, -1.971466064453125, -1.892333984375, -1.813201904296875, -1.73406982421875, -1.654937744140625, -1.5758056640625, -1.496673583984375, -1.41754150390625, -1.338409423828125, -1.25927734375, -1.180145263671875, -1.10101318359375, -1.021881103515625, -0.9427490234375, -0.863616943359375, -0.78448486328125, -0.705352783203125, -0.626220703125, -0.547088623046875, -0.46795654296875, -0.388824462890625, -0.3096923828125, -0.230560302734375, -0.15142822265625, -0.072296142578125, 0.0068359375, 0.085968017578125, 0.16510009765625, 0.244232177734375, 0.3233642578125, 0.402496337890625, 0.48162841796875, 0.560760498046875, 0.639892578125, 0.719024658203125, 0.79815673828125, 0.877288818359375, 0.9564208984375, 1.035552978515625, 1.11468505859375, 1.193817138671875, 1.27294921875, 1.352081298828125, 1.43121337890625, 1.510345458984375, 1.5894775390625, 1.668609619140625, 1.74774169921875, 1.826873779296875, 1.906005859375, 1.985137939453125, 2.06427001953125, 2.143402099609375, 2.2225341796875, 2.301666259765625, 2.38079833984375, 2.459930419921875, 2.5390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 1.0, 7.0, 13.0, 14.0, 28.0, 36.0, 55.0, 81.0, 131.0, 190.0, 146.0, 85.0, 68.0, 33.0, 33.0, 15.0, 17.0, 12.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005517005920410156, -0.0005330741405487061, -0.0005144476890563965, -0.0004958212375640869, -0.00047719478607177734, -0.0004585683345794678, -0.0004399418830871582, -0.00042131543159484863, -0.00040268898010253906, -0.0003840625286102295, -0.0003654360771179199, -0.00034680962562561035, -0.0003281831741333008, -0.0003095567226409912, -0.00029093027114868164, -0.00027230381965637207, -0.0002536773681640625, -0.00023505091667175293, -0.00021642446517944336, -0.0001977980136871338, -0.00017917156219482422, -0.00016054511070251465, -0.00014191865921020508, -0.0001232922077178955, -0.00010466575622558594, -8.603930473327637e-05, -6.74128532409668e-05, -4.8786401748657227e-05, -3.0159950256347656e-05, -1.1533498764038086e-05, 7.092952728271484e-06, 2.5719404220581055e-05, 4.4345855712890625e-05, 6.29723072052002e-05, 8.159875869750977e-05, 0.00010022521018981934, 0.0001188516616821289, 0.00013747811317443848, 0.00015610456466674805, 0.00017473101615905762, 0.0001933574676513672, 0.00021198391914367676, 0.00023061037063598633, 0.0002492368221282959, 0.00026786327362060547, 0.00028648972511291504, 0.0003051161766052246, 0.0003237426280975342, 0.00034236907958984375, 0.0003609955310821533, 0.0003796219825744629, 0.00039824843406677246, 0.00041687488555908203, 0.0004355013370513916, 0.00045412778854370117, 0.00047275424003601074, 0.0004913806915283203, 0.0005100071430206299, 0.0005286335945129395, 0.000547260046005249, 0.0005658864974975586, 0.0005845129489898682, 0.0006031394004821777, 0.0006217658519744873, 0.0006403923034667969]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 7.0, 14.0, 22.0, 20.0, 23.0, 37.0, 51.0, 90.0, 130.0, 155.0, 224.0, 307.0, 483.0, 708.0, 1063.0, 1751.0, 2881.0, 5086.0, 8956.0, 17000.0, 34451.0, 76930.0, 200499.0, 361133.0, 191507.0, 73764.0, 33199.0, 16489.0, 8761.0, 4874.0, 2825.0, 1698.0, 1068.0, 729.0, 479.0, 352.0, 243.0, 185.0, 114.0, 76.0, 48.0, 41.0, 21.0, 12.0, 17.0, 11.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.6513671875, -1.6034698486328125, -1.555572509765625, -1.5076751708984375, -1.45977783203125, -1.4118804931640625, -1.363983154296875, -1.3160858154296875, -1.2681884765625, -1.2202911376953125, -1.172393798828125, -1.1244964599609375, -1.07659912109375, -1.0287017822265625, -0.980804443359375, -0.9329071044921875, -0.885009765625, -0.8371124267578125, -0.789215087890625, -0.7413177490234375, -0.69342041015625, -0.6455230712890625, -0.597625732421875, -0.5497283935546875, -0.5018310546875, -0.4539337158203125, -0.406036376953125, -0.3581390380859375, -0.31024169921875, -0.2623443603515625, -0.214447021484375, -0.1665496826171875, -0.11865234375, -0.0707550048828125, -0.022857666015625, 0.0250396728515625, 0.07293701171875, 0.1208343505859375, 0.168731689453125, 0.2166290283203125, 0.2645263671875, 0.3124237060546875, 0.360321044921875, 0.4082183837890625, 0.45611572265625, 0.5040130615234375, 0.551910400390625, 0.5998077392578125, 0.647705078125, 0.6956024169921875, 0.743499755859375, 0.7913970947265625, 0.83929443359375, 0.8871917724609375, 0.935089111328125, 0.9829864501953125, 1.0308837890625, 1.0787811279296875, 1.126678466796875, 1.1745758056640625, 1.22247314453125, 1.2703704833984375, 1.318267822265625, 1.3661651611328125, 1.4140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 10.0, 14.0, 14.0, 20.0, 18.0, 22.0, 29.0, 29.0, 37.0, 49.0, 46.0, 63.0, 57.0, 76.0, 57.0, 68.0, 54.0, 42.0, 56.0, 37.0, 36.0, 37.0, 20.0, 19.0, 12.0, 16.0, 6.0, 12.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358154296875, -0.3468589782714844, -0.33556365966796875, -0.3242683410644531, -0.3129730224609375, -0.3016777038574219, -0.29038238525390625, -0.2790870666503906, -0.267791748046875, -0.2564964294433594, -0.24520111083984375, -0.23390579223632812, -0.2226104736328125, -0.21131515502929688, -0.20001983642578125, -0.18872451782226562, -0.17742919921875, -0.16613388061523438, -0.15483856201171875, -0.14354324340820312, -0.1322479248046875, -0.12095260620117188, -0.10965728759765625, -0.09836196899414062, -0.087066650390625, -0.07577133178710938, -0.06447601318359375, -0.053180694580078125, -0.0418853759765625, -0.030590057373046875, -0.01929473876953125, -0.007999420166015625, 0.0032958984375, 0.014591217041015625, 0.02588653564453125, 0.037181854248046875, 0.0484771728515625, 0.059772491455078125, 0.07106781005859375, 0.08236312866210938, 0.093658447265625, 0.10495376586914062, 0.11624908447265625, 0.12754440307617188, 0.1388397216796875, 0.15013504028320312, 0.16143035888671875, 0.17272567749023438, 0.18402099609375, 0.19531631469726562, 0.20661163330078125, 0.21790695190429688, 0.2292022705078125, 0.24049758911132812, 0.25179290771484375, 0.2630882263183594, 0.274383544921875, 0.2856788635253906, 0.29697418212890625, 0.3082695007324219, 0.3195648193359375, 0.3308601379394531, 0.34215545654296875, 0.3534507751464844, 0.36474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 9.0, 13.0, 15.0, 13.0, 12.0, 15.0, 25.0, 21.0, 26.0, 22.0, 34.0, 39.0, 42.0, 43.0, 47.0, 46.0, 38.0, 53.0, 62.0, 51.0, 46.0, 52.0, 45.0, 30.0, 34.0, 23.0, 19.0, 10.0, 24.0, 16.0, 17.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.891582489013672, -5.6769866943359375, -5.462390422821045, -5.2477946281433105, -5.033198833465576, -4.818602561950684, -4.604006767272949, -4.389410972595215, -4.1748151779174805, -3.960219144821167, -3.7456233501434326, -3.531027317047119, -3.3164315223693848, -3.1018354892730713, -2.887239456176758, -2.6726436614990234, -2.458047389984131, -2.2434513568878174, -2.028855562210083, -1.8142595291137695, -1.5996636152267456, -1.3850677013397217, -1.1704716682434082, -0.9558757543563843, -0.7412798404693604, -0.5266839265823364, -0.3120879530906677, -0.09749197959899902, 0.1171039342880249, 0.33169984817504883, 0.5462958812713623, 0.7608917951583862, 0.9754881858825684, 1.1900840997695923, 1.4046800136566162, 1.6192760467529297, 1.8338719606399536, 2.0484678745269775, 2.263063907623291, 2.4776597023010254, 2.692255735397339, 2.9068517684936523, 3.1214475631713867, 3.3360435962677, 3.5506396293640137, 3.765235424041748, 3.9798314571380615, 4.194427490234375, 4.409023284912109, 4.623619079589844, 4.838215351104736, 5.052811145782471, 5.267406940460205, 5.482003211975098, 5.696599006652832, 5.911194801330566, 6.125790596008301, 6.340386390686035, 6.554982662200928, 6.769578456878662, 6.9841742515563965, 7.198770523071289, 7.413366317749023, 7.627962112426758, 7.84255838394165]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 8.0, 10.0, 9.0, 14.0, 12.0, 19.0, 18.0, 10.0, 27.0, 25.0, 34.0, 25.0, 34.0, 41.0, 32.0, 49.0, 59.0, 45.0, 49.0, 36.0, 36.0, 33.0, 38.0, 38.0, 28.0, 32.0, 23.0, 30.0, 22.0, 26.0, 24.0, 21.0, 18.0, 16.0, 8.0, 8.0, 3.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.5802998542785645, -6.383635520935059, -6.186971187591553, -5.990306854248047, -5.793642520904541, -5.596978187561035, -5.400313854217529, -5.203649520874023, -5.006985187530518, -4.810320854187012, -4.613656520843506, -4.4169921875, -4.220327854156494, -4.023663520812988, -3.8269991874694824, -3.6303348541259766, -3.4336705207824707, -3.237006187438965, -3.040341854095459, -2.843677520751953, -2.6470131874084473, -2.4503488540649414, -2.2536845207214355, -2.0570201873779297, -1.8603558540344238, -1.663691520690918, -1.467027187347412, -1.2703628540039062, -1.0736985206604004, -0.8770341873168945, -0.6803698539733887, -0.4837055206298828, -0.28704071044921875, -0.09037637710571289, 0.10628795623779297, 0.30295228958129883, 0.4996166229248047, 0.6962809562683105, 0.8929452896118164, 1.0896096229553223, 1.2862739562988281, 1.482938289642334, 1.6796026229858398, 1.8762669563293457, 2.0729312896728516, 2.2695956230163574, 2.4662599563598633, 2.662924289703369, 2.859588623046875, 3.056252956390381, 3.2529172897338867, 3.4495816230773926, 3.6462459564208984, 3.8429102897644043, 4.03957462310791, 4.236238956451416, 4.432903289794922, 4.629567623138428, 4.826231956481934, 5.0228962898254395, 5.219560623168945, 5.416224956512451, 5.612889289855957, 5.809553623199463, 6.006217956542969]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 17.0, 18.0, 36.0, 48.0, 76.0, 105.0, 147.0, 220.0, 327.0, 539.0, 792.0, 1186.0, 1883.0, 2901.0, 4608.0, 7041.0, 11492.0, 18395.0, 28325.0, 44422.0, 66380.0, 93960.0, 122649.0, 139856.0, 137084.0, 114539.0, 85857.0, 58731.0, 39035.0, 24566.0, 15978.0, 9822.0, 6309.0, 3950.0, 2579.0, 1631.0, 1042.0, 667.0, 420.0, 295.0, 222.0, 142.0, 79.0, 69.0, 39.0, 23.0, 25.0, 6.0, 14.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.7734375, -5.5921630859375, -5.410888671875, -5.2296142578125, -5.04833984375, -4.8670654296875, -4.685791015625, -4.5045166015625, -4.3232421875, -4.1419677734375, -3.960693359375, -3.7794189453125, -3.59814453125, -3.4168701171875, -3.235595703125, -3.0543212890625, -2.873046875, -2.6917724609375, -2.510498046875, -2.3292236328125, -2.14794921875, -1.9666748046875, -1.785400390625, -1.6041259765625, -1.4228515625, -1.2415771484375, -1.060302734375, -0.8790283203125, -0.69775390625, -0.5164794921875, -0.335205078125, -0.1539306640625, 0.02734375, 0.2086181640625, 0.389892578125, 0.5711669921875, 0.75244140625, 0.9337158203125, 1.114990234375, 1.2962646484375, 1.4775390625, 1.6588134765625, 1.840087890625, 2.0213623046875, 2.20263671875, 2.3839111328125, 2.565185546875, 2.7464599609375, 2.927734375, 3.1090087890625, 3.290283203125, 3.4715576171875, 3.65283203125, 3.8341064453125, 4.015380859375, 4.1966552734375, 4.3779296875, 4.5592041015625, 4.740478515625, 4.9217529296875, 5.10302734375, 5.2843017578125, 5.465576171875, 5.6468505859375, 5.828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 5.0, 2.0, 4.0, 7.0, 10.0, 17.0, 13.0, 8.0, 13.0, 17.0, 36.0, 23.0, 26.0, 33.0, 33.0, 39.0, 29.0, 41.0, 52.0, 45.0, 46.0, 51.0, 46.0, 33.0, 33.0, 35.0, 42.0, 40.0, 27.0, 27.0, 25.0, 23.0, 31.0, 17.0, 15.0, 8.0, 9.0, 13.0, 6.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-7.2578125, -7.056396484375, -6.85498046875, -6.653564453125, -6.4521484375, -6.250732421875, -6.04931640625, -5.847900390625, -5.646484375, -5.445068359375, -5.24365234375, -5.042236328125, -4.8408203125, -4.639404296875, -4.43798828125, -4.236572265625, -4.03515625, -3.833740234375, -3.63232421875, -3.430908203125, -3.2294921875, -3.028076171875, -2.82666015625, -2.625244140625, -2.423828125, -2.222412109375, -2.02099609375, -1.819580078125, -1.6181640625, -1.416748046875, -1.21533203125, -1.013916015625, -0.8125, -0.611083984375, -0.40966796875, -0.208251953125, -0.0068359375, 0.194580078125, 0.39599609375, 0.597412109375, 0.798828125, 1.000244140625, 1.20166015625, 1.403076171875, 1.6044921875, 1.805908203125, 2.00732421875, 2.208740234375, 2.41015625, 2.611572265625, 2.81298828125, 3.014404296875, 3.2158203125, 3.417236328125, 3.61865234375, 3.820068359375, 4.021484375, 4.222900390625, 4.42431640625, 4.625732421875, 4.8271484375, 5.028564453125, 5.22998046875, 5.431396484375, 5.6328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 23.0, 24.0, 40.0, 47.0, 69.0, 112.0, 177.0, 268.0, 377.0, 601.0, 867.0, 1327.0, 1946.0, 2975.0, 4356.0, 6874.0, 10438.0, 16507.0, 25291.0, 38190.0, 56267.0, 80993.0, 106708.0, 127317.0, 132452.0, 120638.0, 97970.0, 71592.0, 49626.0, 33005.0, 21185.0, 14021.0, 8976.0, 5802.0, 3928.0, 2526.0, 1718.0, 1056.0, 736.0, 475.0, 355.0, 225.0, 143.0, 130.0, 58.0, 51.0, 30.0, 17.0, 15.0, 9.0, 4.0, 5.0, 6.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.10546875, -5.9105224609375, -5.715576171875, -5.5206298828125, -5.32568359375, -5.1307373046875, -4.935791015625, -4.7408447265625, -4.5458984375, -4.3509521484375, -4.156005859375, -3.9610595703125, -3.76611328125, -3.5711669921875, -3.376220703125, -3.1812744140625, -2.986328125, -2.7913818359375, -2.596435546875, -2.4014892578125, -2.20654296875, -2.0115966796875, -1.816650390625, -1.6217041015625, -1.4267578125, -1.2318115234375, -1.036865234375, -0.8419189453125, -0.64697265625, -0.4520263671875, -0.257080078125, -0.0621337890625, 0.1328125, 0.3277587890625, 0.522705078125, 0.7176513671875, 0.91259765625, 1.1075439453125, 1.302490234375, 1.4974365234375, 1.6923828125, 1.8873291015625, 2.082275390625, 2.2772216796875, 2.47216796875, 2.6671142578125, 2.862060546875, 3.0570068359375, 3.251953125, 3.4468994140625, 3.641845703125, 3.8367919921875, 4.03173828125, 4.2266845703125, 4.421630859375, 4.6165771484375, 4.8115234375, 5.0064697265625, 5.201416015625, 5.3963623046875, 5.59130859375, 5.7862548828125, 5.981201171875, 6.1761474609375, 6.37109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 9.0, 3.0, 9.0, 8.0, 8.0, 12.0, 11.0, 15.0, 13.0, 29.0, 38.0, 25.0, 33.0, 33.0, 32.0, 34.0, 49.0, 44.0, 32.0, 38.0, 41.0, 50.0, 41.0, 43.0, 37.0, 36.0, 30.0, 37.0, 34.0, 24.0, 23.0, 16.0, 9.0, 18.0, 20.0, 8.0, 9.0, 8.0, 11.0, 8.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.512969970703125, -3.39117431640625, -3.269378662109375, -3.1475830078125, -3.025787353515625, -2.90399169921875, -2.782196044921875, -2.660400390625, -2.538604736328125, -2.41680908203125, -2.295013427734375, -2.1732177734375, -2.051422119140625, -1.92962646484375, -1.807830810546875, -1.68603515625, -1.564239501953125, -1.44244384765625, -1.320648193359375, -1.1988525390625, -1.077056884765625, -0.95526123046875, -0.833465576171875, -0.711669921875, -0.589874267578125, -0.46807861328125, -0.346282958984375, -0.2244873046875, -0.102691650390625, 0.01910400390625, 0.140899658203125, 0.2626953125, 0.384490966796875, 0.50628662109375, 0.628082275390625, 0.7498779296875, 0.871673583984375, 0.99346923828125, 1.115264892578125, 1.237060546875, 1.358856201171875, 1.48065185546875, 1.602447509765625, 1.7242431640625, 1.846038818359375, 1.96783447265625, 2.089630126953125, 2.21142578125, 2.333221435546875, 2.45501708984375, 2.576812744140625, 2.6986083984375, 2.820404052734375, 2.94219970703125, 3.063995361328125, 3.185791015625, 3.307586669921875, 3.42938232421875, 3.551177978515625, 3.6729736328125, 3.794769287109375, 3.91656494140625, 4.038360595703125, 4.16015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 4.0, 9.0, 5.0, 7.0, 14.0, 10.0, 26.0, 33.0, 41.0, 75.0, 84.0, 108.0, 169.0, 240.0, 339.0, 479.0, 741.0, 1060.0, 1546.0, 2472.0, 3802.0, 6103.0, 10114.0, 17144.0, 31079.0, 57401.0, 106904.0, 178893.0, 219063.0, 175251.0, 104485.0, 56539.0, 30444.0, 16805.0, 9978.0, 5914.0, 3765.0, 2454.0, 1569.0, 1036.0, 724.0, 467.0, 341.0, 242.0, 171.0, 127.0, 90.0, 64.0, 34.0, 42.0, 15.0, 10.0, 9.0, 10.0, 10.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.21484375, -4.0850830078125, -3.955322265625, -3.8255615234375, -3.69580078125, -3.5660400390625, -3.436279296875, -3.3065185546875, -3.1767578125, -3.0469970703125, -2.917236328125, -2.7874755859375, -2.65771484375, -2.5279541015625, -2.398193359375, -2.2684326171875, -2.138671875, -2.0089111328125, -1.879150390625, -1.7493896484375, -1.61962890625, -1.4898681640625, -1.360107421875, -1.2303466796875, -1.1005859375, -0.9708251953125, -0.841064453125, -0.7113037109375, -0.58154296875, -0.4517822265625, -0.322021484375, -0.1922607421875, -0.0625, 0.0672607421875, 0.197021484375, 0.3267822265625, 0.45654296875, 0.5863037109375, 0.716064453125, 0.8458251953125, 0.9755859375, 1.1053466796875, 1.235107421875, 1.3648681640625, 1.49462890625, 1.6243896484375, 1.754150390625, 1.8839111328125, 2.013671875, 2.1434326171875, 2.273193359375, 2.4029541015625, 2.53271484375, 2.6624755859375, 2.792236328125, 2.9219970703125, 3.0517578125, 3.1815185546875, 3.311279296875, 3.4410400390625, 3.57080078125, 3.7005615234375, 3.830322265625, 3.9600830078125, 4.08984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 7.0, 5.0, 12.0, 9.0, 15.0, 18.0, 22.0, 20.0, 30.0, 42.0, 71.0, 74.0, 74.0, 80.0, 77.0, 82.0, 68.0, 59.0, 52.0, 37.0, 41.0, 17.0, 14.0, 17.0, 16.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004391670227050781, -0.00042442232370376587, -0.0004096776247024536, -0.00039493292570114136, -0.0003801882266998291, -0.00036544352769851685, -0.0003506988286972046, -0.00033595412969589233, -0.0003212094306945801, -0.0003064647316932678, -0.00029172003269195557, -0.0002769753336906433, -0.00026223063468933105, -0.0002474859356880188, -0.00023274123668670654, -0.0002179965376853943, -0.00020325183868408203, -0.00018850713968276978, -0.00017376244068145752, -0.00015901774168014526, -0.000144273042678833, -0.00012952834367752075, -0.0001147836446762085, -0.00010003894567489624, -8.529424667358398e-05, -7.054954767227173e-05, -5.580484867095947e-05, -4.106014966964722e-05, -2.631545066833496e-05, -1.1570751667022705e-05, 3.1739473342895508e-06, 1.7918646335601807e-05, 3.266334533691406e-05, 4.740804433822632e-05, 6.215274333953857e-05, 7.689744234085083e-05, 9.164214134216309e-05, 0.00010638684034347534, 0.0001211315393447876, 0.00013587623834609985, 0.0001506209373474121, 0.00016536563634872437, 0.00018011033535003662, 0.00019485503435134888, 0.00020959973335266113, 0.0002243444323539734, 0.00023908913135528564, 0.0002538338303565979, 0.00026857852935791016, 0.0002833232283592224, 0.00029806792736053467, 0.0003128126263618469, 0.0003275573253631592, 0.00034230202436447144, 0.0003570467233657837, 0.00037179142236709595, 0.0003865361213684082, 0.00040128082036972046, 0.0004160255193710327, 0.00043077021837234497, 0.0004455149173736572, 0.0004602596163749695, 0.00047500431537628174, 0.000489749014377594, 0.0005044937133789062]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 5.0, 15.0, 17.0, 27.0, 32.0, 45.0, 66.0, 100.0, 153.0, 238.0, 339.0, 556.0, 820.0, 1240.0, 1984.0, 3029.0, 5194.0, 8543.0, 15116.0, 28148.0, 54869.0, 108086.0, 188857.0, 233325.0, 181642.0, 102454.0, 51419.0, 26477.0, 14349.0, 8056.0, 4823.0, 2983.0, 1933.0, 1177.0, 835.0, 546.0, 362.0, 225.0, 174.0, 91.0, 59.0, 54.0, 20.0, 24.0, 12.0, 15.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-4.35546875, -4.22528076171875, -4.0950927734375, -3.96490478515625, -3.834716796875, -3.70452880859375, -3.5743408203125, -3.44415283203125, -3.31396484375, -3.18377685546875, -3.0535888671875, -2.92340087890625, -2.793212890625, -2.66302490234375, -2.5328369140625, -2.40264892578125, -2.2724609375, -2.14227294921875, -2.0120849609375, -1.88189697265625, -1.751708984375, -1.62152099609375, -1.4913330078125, -1.36114501953125, -1.23095703125, -1.10076904296875, -0.9705810546875, -0.84039306640625, -0.710205078125, -0.58001708984375, -0.4498291015625, -0.31964111328125, -0.189453125, -0.05926513671875, 0.0709228515625, 0.20111083984375, 0.331298828125, 0.46148681640625, 0.5916748046875, 0.72186279296875, 0.85205078125, 0.98223876953125, 1.1124267578125, 1.24261474609375, 1.372802734375, 1.50299072265625, 1.6331787109375, 1.76336669921875, 1.8935546875, 2.02374267578125, 2.1539306640625, 2.28411865234375, 2.414306640625, 2.54449462890625, 2.6746826171875, 2.80487060546875, 2.93505859375, 3.06524658203125, 3.1954345703125, 3.32562255859375, 3.455810546875, 3.58599853515625, 3.7161865234375, 3.84637451171875, 3.9765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 7.0, 7.0, 3.0, 6.0, 5.0, 9.0, 7.0, 13.0, 14.0, 18.0, 29.0, 29.0, 38.0, 40.0, 57.0, 61.0, 58.0, 61.0, 50.0, 63.0, 56.0, 47.0, 59.0, 55.0, 38.0, 29.0, 34.0, 27.0, 17.0, 8.0, 15.0, 19.0, 8.0, 2.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2763671875, -1.23614501953125, -1.1959228515625, -1.15570068359375, -1.115478515625, -1.07525634765625, -1.0350341796875, -0.99481201171875, -0.95458984375, -0.91436767578125, -0.8741455078125, -0.83392333984375, -0.793701171875, -0.75347900390625, -0.7132568359375, -0.67303466796875, -0.6328125, -0.59259033203125, -0.5523681640625, -0.51214599609375, -0.471923828125, -0.43170166015625, -0.3914794921875, -0.35125732421875, -0.31103515625, -0.27081298828125, -0.2305908203125, -0.19036865234375, -0.150146484375, -0.10992431640625, -0.0697021484375, -0.02947998046875, 0.0107421875, 0.05096435546875, 0.0911865234375, 0.13140869140625, 0.171630859375, 0.21185302734375, 0.2520751953125, 0.29229736328125, 0.33251953125, 0.37274169921875, 0.4129638671875, 0.45318603515625, 0.493408203125, 0.53363037109375, 0.5738525390625, 0.61407470703125, 0.654296875, 0.69451904296875, 0.7347412109375, 0.77496337890625, 0.815185546875, 0.85540771484375, 0.8956298828125, 0.93585205078125, 0.97607421875, 1.01629638671875, 1.0565185546875, 1.09674072265625, 1.136962890625, 1.17718505859375, 1.2174072265625, 1.25762939453125, 1.2978515625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 9.0, 7.0, 15.0, 13.0, 15.0, 23.0, 17.0, 18.0, 29.0, 41.0, 31.0, 47.0, 35.0, 53.0, 54.0, 36.0, 52.0, 53.0, 56.0, 57.0, 42.0, 45.0, 47.0, 24.0, 36.0, 21.0, 20.0, 20.0, 14.0, 11.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.583103179931641, -5.363656520843506, -5.144209861755371, -4.924763202667236, -4.705316543579102, -4.485869884490967, -4.266423225402832, -4.046976089477539, -3.8275296688079834, -3.6080830097198486, -3.388636350631714, -3.169189453125, -2.9497427940368652, -2.7302961349487305, -2.5108494758605957, -2.291402816772461, -2.071956157684326, -1.8525094985961914, -1.6330628395080566, -1.4136160612106323, -1.1941694021224976, -0.9747227430343628, -0.7552759647369385, -0.5358293056488037, -0.31638264656066895, -0.09693595767021179, 0.12251073122024536, 0.3419574499130249, 0.5614041090011597, 0.7808507680892944, 1.0002975463867188, 1.2197442054748535, 1.4391908645629883, 1.658637523651123, 1.8780841827392578, 2.0975308418273926, 2.3169775009155273, 2.536424160003662, 2.755871057510376, 2.9753177165985107, 3.1947643756866455, 3.4142110347747803, 3.633657693862915, 3.853104591369629, 4.072551250457764, 4.291997909545898, 4.511444568634033, 4.730891227722168, 4.950337886810303, 5.1697845458984375, 5.389231204986572, 5.608677864074707, 5.828124523162842, 6.047571182250977, 6.2670183181762695, 6.486464500427246, 6.705911636352539, 6.925358295440674, 7.144804954528809, 7.364251613616943, 7.583698272705078, 7.803144931793213, 8.022591590881348, 8.24203872680664, 8.461484909057617]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 3.0, 7.0, 7.0, 4.0, 10.0, 8.0, 8.0, 11.0, 14.0, 15.0, 28.0, 25.0, 32.0, 25.0, 28.0, 22.0, 29.0, 41.0, 38.0, 47.0, 35.0, 51.0, 42.0, 33.0, 38.0, 40.0, 26.0, 32.0, 34.0, 34.0, 22.0, 24.0, 25.0, 19.0, 17.0, 17.0, 15.0, 17.0, 10.0, 19.0, 9.0, 6.0, 6.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.365121364593506, -5.188601493835449, -5.012082099914551, -4.835562705993652, -4.659042835235596, -4.482522964477539, -4.306003570556641, -4.129484176635742, -3.9529643058776855, -3.776444673538208, -3.5999250411987305, -3.423405408859253, -3.2468857765197754, -3.070366144180298, -2.8938465118408203, -2.7173268795013428, -2.5408072471618652, -2.3642876148223877, -2.18776798248291, -2.0112483501434326, -1.834728717803955, -1.6582090854644775, -1.481689453125, -1.3051698207855225, -1.128650188446045, -0.9521305561065674, -0.7756109237670898, -0.5990912914276123, -0.42257165908813477, -0.24605202674865723, -0.06953239440917969, 0.10698723793029785, 0.2835068702697754, 0.46002650260925293, 0.6365461349487305, 0.813065767288208, 0.9895853996276855, 1.166105031967163, 1.3426246643066406, 1.5191442966461182, 1.6956639289855957, 1.8721835613250732, 2.048703193664551, 2.2252228260040283, 2.401742458343506, 2.5782620906829834, 2.754781723022461, 2.9313013553619385, 3.107820987701416, 3.2843406200408936, 3.460860252380371, 3.6373798847198486, 3.813899517059326, 3.9904191493988037, 4.166938781738281, 4.34345817565918, 4.519978046417236, 4.696497917175293, 4.873017311096191, 5.04953670501709, 5.2260565757751465, 5.402576446533203, 5.579095840454102, 5.755615234375, 5.932135105133057]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 16.0, 27.0, 35.0, 59.0, 69.0, 123.0, 166.0, 258.0, 399.0, 604.0, 977.0, 1598.0, 2769.0, 4610.0, 8546.0, 15827.0, 30966.0, 63131.0, 135812.0, 296881.0, 593814.0, 910361.0, 923713.0, 615174.0, 310188.0, 141576.0, 66059.0, 32338.0, 16657.0, 8818.0, 5039.0, 2883.0, 1749.0, 1097.0, 727.0, 414.0, 282.0, 177.0, 107.0, 74.0, 53.0, 55.0, 21.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.30084228515625, -6.0977783203125, -5.89471435546875, -5.691650390625, -5.48858642578125, -5.2855224609375, -5.08245849609375, -4.87939453125, -4.67633056640625, -4.4732666015625, -4.27020263671875, -4.067138671875, -3.86407470703125, -3.6610107421875, -3.45794677734375, -3.2548828125, -3.05181884765625, -2.8487548828125, -2.64569091796875, -2.442626953125, -2.23956298828125, -2.0364990234375, -1.83343505859375, -1.63037109375, -1.42730712890625, -1.2242431640625, -1.02117919921875, -0.818115234375, -0.61505126953125, -0.4119873046875, -0.20892333984375, -0.005859375, 0.19720458984375, 0.4002685546875, 0.60333251953125, 0.806396484375, 1.00946044921875, 1.2125244140625, 1.41558837890625, 1.61865234375, 1.82171630859375, 2.0247802734375, 2.22784423828125, 2.430908203125, 2.63397216796875, 2.8370361328125, 3.04010009765625, 3.2431640625, 3.44622802734375, 3.6492919921875, 3.85235595703125, 4.055419921875, 4.25848388671875, 4.4615478515625, 4.66461181640625, 4.86767578125, 5.07073974609375, 5.2738037109375, 5.47686767578125, 5.679931640625, 5.88299560546875, 6.0860595703125, 6.28912353515625, 6.4921875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 2.0, 5.0, 6.0, 11.0, 9.0, 10.0, 10.0, 19.0, 12.0, 18.0, 21.0, 23.0, 23.0, 28.0, 32.0, 31.0, 25.0, 39.0, 52.0, 39.0, 36.0, 48.0, 44.0, 44.0, 44.0, 43.0, 38.0, 28.0, 30.0, 19.0, 24.0, 17.0, 13.0, 22.0, 21.0, 23.0, 15.0, 16.0, 9.0, 7.0, 9.0, 7.0, 5.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.2877197265625, -4.134033203125, -3.9803466796875, -3.82666015625, -3.6729736328125, -3.519287109375, -3.3656005859375, -3.2119140625, -3.0582275390625, -2.904541015625, -2.7508544921875, -2.59716796875, -2.4434814453125, -2.289794921875, -2.1361083984375, -1.982421875, -1.8287353515625, -1.675048828125, -1.5213623046875, -1.36767578125, -1.2139892578125, -1.060302734375, -0.9066162109375, -0.7529296875, -0.5992431640625, -0.445556640625, -0.2918701171875, -0.13818359375, 0.0155029296875, 0.169189453125, 0.3228759765625, 0.4765625, 0.6302490234375, 0.783935546875, 0.9376220703125, 1.09130859375, 1.2449951171875, 1.398681640625, 1.5523681640625, 1.7060546875, 1.8597412109375, 2.013427734375, 2.1671142578125, 2.32080078125, 2.4744873046875, 2.628173828125, 2.7818603515625, 2.935546875, 3.0892333984375, 3.242919921875, 3.3966064453125, 3.55029296875, 3.7039794921875, 3.857666015625, 4.0113525390625, 4.1650390625, 4.3187255859375, 4.472412109375, 4.6260986328125, 4.77978515625, 4.9334716796875, 5.087158203125, 5.2408447265625, 5.39453125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 15.0, 24.0, 26.0, 55.0, 101.0, 155.0, 229.0, 365.0, 692.0, 1156.0, 2089.0, 3988.0, 7443.0, 15333.0, 31893.0, 68701.0, 152811.0, 335953.0, 673263.0, 1017380.0, 907492.0, 519294.0, 246506.0, 110722.0, 50582.0, 23622.0, 11468.0, 5897.0, 3036.0, 1614.0, 926.0, 530.0, 314.0, 197.0, 130.0, 83.0, 59.0, 51.0, 25.0, 18.0, 10.0, 5.0, 5.0, 9.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.421875, -9.15869140625, -8.8955078125, -8.63232421875, -8.369140625, -8.10595703125, -7.8427734375, -7.57958984375, -7.31640625, -7.05322265625, -6.7900390625, -6.52685546875, -6.263671875, -6.00048828125, -5.7373046875, -5.47412109375, -5.2109375, -4.94775390625, -4.6845703125, -4.42138671875, -4.158203125, -3.89501953125, -3.6318359375, -3.36865234375, -3.10546875, -2.84228515625, -2.5791015625, -2.31591796875, -2.052734375, -1.78955078125, -1.5263671875, -1.26318359375, -1.0, -0.73681640625, -0.4736328125, -0.21044921875, 0.052734375, 0.31591796875, 0.5791015625, 0.84228515625, 1.10546875, 1.36865234375, 1.6318359375, 1.89501953125, 2.158203125, 2.42138671875, 2.6845703125, 2.94775390625, 3.2109375, 3.47412109375, 3.7373046875, 4.00048828125, 4.263671875, 4.52685546875, 4.7900390625, 5.05322265625, 5.31640625, 5.57958984375, 5.8427734375, 6.10595703125, 6.369140625, 6.63232421875, 6.8955078125, 7.15869140625, 7.421875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 8.0, 18.0, 22.0, 34.0, 35.0, 51.0, 79.0, 81.0, 93.0, 138.0, 160.0, 193.0, 235.0, 306.0, 311.0, 317.0, 302.0, 284.0, 249.0, 231.0, 202.0, 156.0, 144.0, 107.0, 81.0, 58.0, 43.0, 43.0, 25.0, 21.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.888671875, -2.7978515625, -2.70703125, -2.6162109375, -2.525390625, -2.4345703125, -2.34375, -2.2529296875, -2.162109375, -2.0712890625, -1.98046875, -1.8896484375, -1.798828125, -1.7080078125, -1.6171875, -1.5263671875, -1.435546875, -1.3447265625, -1.25390625, -1.1630859375, -1.072265625, -0.9814453125, -0.890625, -0.7998046875, -0.708984375, -0.6181640625, -0.52734375, -0.4365234375, -0.345703125, -0.2548828125, -0.1640625, -0.0732421875, 0.017578125, 0.1083984375, 0.19921875, 0.2900390625, 0.380859375, 0.4716796875, 0.5625, 0.6533203125, 0.744140625, 0.8349609375, 0.92578125, 1.0166015625, 1.107421875, 1.1982421875, 1.2890625, 1.3798828125, 1.470703125, 1.5615234375, 1.65234375, 1.7431640625, 1.833984375, 1.9248046875, 2.015625, 2.1064453125, 2.197265625, 2.2880859375, 2.37890625, 2.4697265625, 2.560546875, 2.6513671875, 2.7421875, 2.8330078125, 2.923828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 8.0, 9.0, 15.0, 19.0, 19.0, 18.0, 19.0, 36.0, 29.0, 28.0, 25.0, 34.0, 51.0, 55.0, 41.0, 51.0, 51.0, 34.0, 40.0, 45.0, 49.0, 45.0, 36.0, 38.0, 29.0, 26.0, 25.0, 22.0, 14.0, 14.0, 15.0, 7.0, 9.0, 5.0, 5.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.112536907196045, -5.9177680015563965, -5.722999095916748, -5.5282301902771, -5.333461284637451, -5.138692855834961, -4.9439239501953125, -4.749155044555664, -4.554386138916016, -4.359617233276367, -4.164848327636719, -3.9700794219970703, -3.775310754776001, -3.5805418491363525, -3.385772943496704, -3.1910042762756348, -2.9962351322174072, -2.801466226577759, -2.6066973209381104, -2.411928653717041, -2.2171597480773926, -2.022390842437744, -1.8276219367980957, -1.6328531503677368, -1.4380842447280884, -1.24331533908844, -1.048546552658081, -0.8537776470184326, -0.659008800983429, -0.4642399549484253, -0.26947104930877686, -0.07470226287841797, 0.12006664276123047, 0.31483548879623413, 0.5096043348312378, 0.7043732404708862, 0.8991420865058899, 1.0939109325408936, 1.288679838180542, 1.4834486246109009, 1.6782175302505493, 1.8729864358901978, 2.0677552223205566, 2.262524127960205, 2.4572930335998535, 2.652061939239502, 2.8468308448791504, 3.0415995121002197, 3.236368417739868, 3.4311373233795166, 3.625906229019165, 3.8206748962402344, 4.015443801879883, 4.210212707519531, 4.40498161315918, 4.599750518798828, 4.794519424438477, 4.989288330078125, 5.184057235717773, 5.378826141357422, 5.57359504699707, 5.768363952636719, 5.963132858276367, 6.157901287078857, 6.352670192718506]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 8.0, 3.0, 12.0, 5.0, 13.0, 17.0, 15.0, 25.0, 30.0, 18.0, 28.0, 20.0, 32.0, 42.0, 35.0, 39.0, 37.0, 34.0, 46.0, 38.0, 41.0, 43.0, 35.0, 33.0, 43.0, 35.0, 29.0, 19.0, 31.0, 24.0, 24.0, 24.0, 13.0, 15.0, 18.0, 11.0, 12.0, 4.0, 8.0, 12.0, 6.0, 5.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.838825225830078, -4.665224075317383, -4.4916229248046875, -4.31802225112915, -4.144421100616455, -3.9708199501037598, -3.7972190380096436, -3.6236181259155273, -3.450016975402832, -3.2764158248901367, -3.1028149127960205, -2.9292140007019043, -2.755612850189209, -2.5820116996765137, -2.4084107875823975, -2.2348098754882812, -2.061208724975586, -1.8876076936721802, -1.7140066623687744, -1.5404056310653687, -1.366804599761963, -1.1932035684585571, -1.0196025371551514, -0.8460015058517456, -0.6724004745483398, -0.4987994432449341, -0.3251984119415283, -0.15159738063812256, 0.022003650665283203, 0.19560468196868896, 0.3692057132720947, 0.5428067445755005, 0.7164077758789062, 0.890008807182312, 1.0636098384857178, 1.2372108697891235, 1.4108119010925293, 1.584412932395935, 1.7580139636993408, 1.9316149950027466, 2.1052160263061523, 2.2788171768188477, 2.452418088912964, 2.62601900100708, 2.7996201515197754, 2.9732213020324707, 3.146822214126587, 3.320423126220703, 3.4940242767333984, 3.6676254272460938, 3.84122633934021, 4.014827251434326, 4.1884284019470215, 4.362029552459717, 4.535630226135254, 4.709231376647949, 4.8828325271606445, 5.05643367767334, 5.230034828186035, 5.403635501861572, 5.577236652374268, 5.750837802886963, 5.9244384765625, 6.098039627075195, 6.271640777587891]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 15.0, 26.0, 28.0, 38.0, 51.0, 84.0, 124.0, 142.0, 239.0, 423.0, 627.0, 954.0, 1578.0, 2731.0, 4827.0, 8458.0, 15394.0, 28723.0, 53009.0, 97454.0, 163352.0, 213463.0, 187933.0, 120719.0, 67234.0, 36259.0, 19331.0, 10594.0, 5985.0, 3374.0, 2092.0, 1214.0, 746.0, 475.0, 279.0, 190.0, 143.0, 76.0, 53.0, 40.0, 28.0, 18.0, 16.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.361328125, -3.26971435546875, -3.1781005859375, -3.08648681640625, -2.994873046875, -2.90325927734375, -2.8116455078125, -2.72003173828125, -2.62841796875, -2.53680419921875, -2.4451904296875, -2.35357666015625, -2.261962890625, -2.17034912109375, -2.0787353515625, -1.98712158203125, -1.8955078125, -1.80389404296875, -1.7122802734375, -1.62066650390625, -1.529052734375, -1.43743896484375, -1.3458251953125, -1.25421142578125, -1.16259765625, -1.07098388671875, -0.9793701171875, -0.88775634765625, -0.796142578125, -0.70452880859375, -0.6129150390625, -0.52130126953125, -0.4296875, -0.33807373046875, -0.2464599609375, -0.15484619140625, -0.063232421875, 0.02838134765625, 0.1199951171875, 0.21160888671875, 0.30322265625, 0.39483642578125, 0.4864501953125, 0.57806396484375, 0.669677734375, 0.76129150390625, 0.8529052734375, 0.94451904296875, 1.0361328125, 1.12774658203125, 1.2193603515625, 1.31097412109375, 1.402587890625, 1.49420166015625, 1.5858154296875, 1.67742919921875, 1.76904296875, 1.86065673828125, 1.9522705078125, 2.04388427734375, 2.135498046875, 2.22711181640625, 2.3187255859375, 2.41033935546875, 2.501953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 9.0, 9.0, 14.0, 11.0, 11.0, 12.0, 20.0, 21.0, 20.0, 21.0, 20.0, 29.0, 30.0, 34.0, 28.0, 40.0, 40.0, 35.0, 43.0, 29.0, 45.0, 38.0, 35.0, 38.0, 31.0, 41.0, 31.0, 33.0, 30.0, 28.0, 21.0, 26.0, 16.0, 16.0, 12.0, 7.0, 13.0, 9.0, 10.0, 10.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.4609375, -5.28753662109375, -5.1141357421875, -4.94073486328125, -4.767333984375, -4.59393310546875, -4.4205322265625, -4.24713134765625, -4.07373046875, -3.90032958984375, -3.7269287109375, -3.55352783203125, -3.380126953125, -3.20672607421875, -3.0333251953125, -2.85992431640625, -2.6865234375, -2.51312255859375, -2.3397216796875, -2.16632080078125, -1.992919921875, -1.81951904296875, -1.6461181640625, -1.47271728515625, -1.29931640625, -1.12591552734375, -0.9525146484375, -0.77911376953125, -0.605712890625, -0.43231201171875, -0.2589111328125, -0.08551025390625, 0.087890625, 0.26129150390625, 0.4346923828125, 0.60809326171875, 0.781494140625, 0.95489501953125, 1.1282958984375, 1.30169677734375, 1.47509765625, 1.64849853515625, 1.8218994140625, 1.99530029296875, 2.168701171875, 2.34210205078125, 2.5155029296875, 2.68890380859375, 2.8623046875, 3.03570556640625, 3.2091064453125, 3.38250732421875, 3.555908203125, 3.72930908203125, 3.9027099609375, 4.07611083984375, 4.24951171875, 4.42291259765625, 4.5963134765625, 4.76971435546875, 4.943115234375, 5.11651611328125, 5.2899169921875, 5.46331787109375, 5.63671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 17.0, 21.0, 14.0, 29.0, 50.0, 80.0, 86.0, 129.0, 184.0, 311.0, 436.0, 742.0, 1171.0, 1969.0, 3349.0, 5928.0, 10657.0, 19475.0, 45176.0, 700341.0, 193951.0, 29369.0, 15052.0, 8351.0, 4694.0, 2652.0, 1579.0, 940.0, 571.0, 403.0, 250.0, 179.0, 129.0, 84.0, 57.0, 44.0, 28.0, 20.0, 16.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.75, -6.55023193359375, -6.3504638671875, -6.15069580078125, -5.950927734375, -5.75115966796875, -5.5513916015625, -5.35162353515625, -5.15185546875, -4.95208740234375, -4.7523193359375, -4.55255126953125, -4.352783203125, -4.15301513671875, -3.9532470703125, -3.75347900390625, -3.5537109375, -3.35394287109375, -3.1541748046875, -2.95440673828125, -2.754638671875, -2.55487060546875, -2.3551025390625, -2.15533447265625, -1.95556640625, -1.75579833984375, -1.5560302734375, -1.35626220703125, -1.156494140625, -0.95672607421875, -0.7569580078125, -0.55718994140625, -0.357421875, -0.15765380859375, 0.0421142578125, 0.24188232421875, 0.441650390625, 0.64141845703125, 0.8411865234375, 1.04095458984375, 1.24072265625, 1.44049072265625, 1.6402587890625, 1.84002685546875, 2.039794921875, 2.23956298828125, 2.4393310546875, 2.63909912109375, 2.8388671875, 3.03863525390625, 3.2384033203125, 3.43817138671875, 3.637939453125, 3.83770751953125, 4.0374755859375, 4.23724365234375, 4.43701171875, 4.63677978515625, 4.8365478515625, 5.03631591796875, 5.236083984375, 5.43585205078125, 5.6356201171875, 5.83538818359375, 6.03515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 12.0, 15.0, 19.0, 26.0, 12.0, 25.0, 30.0, 32.0, 33.0, 35.0, 39.0, 41.0, 34.0, 45.0, 31.0, 39.0, 46.0, 46.0, 47.0, 37.0, 43.0, 39.0, 37.0, 30.0, 28.0, 30.0, 27.0, 14.0, 11.0, 17.0, 13.0, 14.0, 13.0, 10.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.60546875, -4.4522705078125, -4.299072265625, -4.1458740234375, -3.99267578125, -3.8394775390625, -3.686279296875, -3.5330810546875, -3.3798828125, -3.2266845703125, -3.073486328125, -2.9202880859375, -2.76708984375, -2.6138916015625, -2.460693359375, -2.3074951171875, -2.154296875, -2.0010986328125, -1.847900390625, -1.6947021484375, -1.54150390625, -1.3883056640625, -1.235107421875, -1.0819091796875, -0.9287109375, -0.7755126953125, -0.622314453125, -0.4691162109375, -0.31591796875, -0.1627197265625, -0.009521484375, 0.1436767578125, 0.296875, 0.4500732421875, 0.603271484375, 0.7564697265625, 0.90966796875, 1.0628662109375, 1.216064453125, 1.3692626953125, 1.5224609375, 1.6756591796875, 1.828857421875, 1.9820556640625, 2.13525390625, 2.2884521484375, 2.441650390625, 2.5948486328125, 2.748046875, 2.9012451171875, 3.054443359375, 3.2076416015625, 3.36083984375, 3.5140380859375, 3.667236328125, 3.8204345703125, 3.9736328125, 4.1268310546875, 4.280029296875, 4.4332275390625, 4.58642578125, 4.7396240234375, 4.892822265625, 5.0460205078125, 5.19921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 8.0, 10.0, 14.0, 12.0, 18.0, 23.0, 36.0, 47.0, 66.0, 99.0, 153.0, 204.0, 309.0, 499.0, 727.0, 1143.0, 1897.0, 3525.0, 6567.0, 14035.0, 37938.0, 563726.0, 357147.0, 33069.0, 13002.0, 6016.0, 3258.0, 1803.0, 1087.0, 694.0, 452.0, 274.0, 198.0, 135.0, 89.0, 73.0, 45.0, 37.0, 32.0, 28.0, 14.0, 11.0, 7.0, 5.0, 1.0, 4.0, 0.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.927734375, -0.8995742797851562, -0.8714141845703125, -0.8432540893554688, -0.815093994140625, -0.7869338989257812, -0.7587738037109375, -0.7306137084960938, -0.70245361328125, -0.6742935180664062, -0.6461334228515625, -0.6179733276367188, -0.589813232421875, -0.5616531372070312, -0.5334930419921875, -0.5053329467773438, -0.4771728515625, -0.44901275634765625, -0.4208526611328125, -0.39269256591796875, -0.364532470703125, -0.33637237548828125, -0.3082122802734375, -0.28005218505859375, -0.25189208984375, -0.22373199462890625, -0.1955718994140625, -0.16741180419921875, -0.139251708984375, -0.11109161376953125, -0.0829315185546875, -0.05477142333984375, -0.026611328125, 0.00154876708984375, 0.0297088623046875, 0.05786895751953125, 0.086029052734375, 0.11418914794921875, 0.1423492431640625, 0.17050933837890625, 0.19866943359375, 0.22682952880859375, 0.2549896240234375, 0.28314971923828125, 0.311309814453125, 0.33946990966796875, 0.3676300048828125, 0.39579010009765625, 0.4239501953125, 0.45211029052734375, 0.4802703857421875, 0.5084304809570312, 0.536590576171875, 0.5647506713867188, 0.5929107666015625, 0.6210708618164062, 0.64923095703125, 0.6773910522460938, 0.7055511474609375, 0.7337112426757812, 0.761871337890625, 0.7900314331054688, 0.8181915283203125, 0.8463516235351562, 0.87451171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 5.0, 12.0, 15.0, 30.0, 57.0, 82.0, 124.0, 200.0, 175.0, 123.0, 64.0, 46.0, 29.0, 15.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020003318786621094, -0.00019354559481143951, -0.0001870580017566681, -0.00018057040870189667, -0.00017408281564712524, -0.00016759522259235382, -0.0001611076295375824, -0.00015462003648281097, -0.00014813244342803955, -0.00014164485037326813, -0.0001351572573184967, -0.00012866966426372528, -0.00012218207120895386, -0.00011569447815418243, -0.00010920688509941101, -0.00010271929204463959, -9.623169898986816e-05, -8.974410593509674e-05, -8.325651288032532e-05, -7.67689198255539e-05, -7.028132677078247e-05, -6.379373371601105e-05, -5.7306140661239624e-05, -5.08185476064682e-05, -4.433095455169678e-05, -3.7843361496925354e-05, -3.135576844215393e-05, -2.4868175387382507e-05, -1.8380582332611084e-05, -1.189298927783966e-05, -5.405396223068237e-06, 1.082196831703186e-06, 7.569789886474609e-06, 1.4057382941246033e-05, 2.0544975996017456e-05, 2.703256905078888e-05, 3.35201621055603e-05, 4.0007755160331726e-05, 4.649534821510315e-05, 5.298294126987457e-05, 5.9470534324645996e-05, 6.595812737941742e-05, 7.244572043418884e-05, 7.893331348896027e-05, 8.542090654373169e-05, 9.190849959850311e-05, 9.839609265327454e-05, 0.00010488368570804596, 0.00011137127876281738, 0.0001178588718175888, 0.00012434646487236023, 0.00013083405792713165, 0.00013732165098190308, 0.0001438092440366745, 0.00015029683709144592, 0.00015678443014621735, 0.00016327202320098877, 0.0001697596162557602, 0.00017624720931053162, 0.00018273480236530304, 0.00018922239542007446, 0.00019570998847484589, 0.0002021975815296173, 0.00020868517458438873, 0.00021517276763916016]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 14.0, 11.0, 16.0, 28.0, 45.0, 58.0, 86.0, 129.0, 207.0, 281.0, 424.0, 641.0, 1043.0, 1643.0, 2902.0, 5335.0, 10889.0, 24725.0, 61106.0, 150323.0, 279175.0, 269827.0, 138317.0, 55945.0, 23044.0, 10175.0, 5069.0, 2643.0, 1533.0, 987.0, 629.0, 429.0, 272.0, 192.0, 113.0, 92.0, 69.0, 42.0, 37.0, 22.0, 4.0, 16.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6213455200195312, -0.6006011962890625, -0.5798568725585938, -0.559112548828125, -0.5383682250976562, -0.5176239013671875, -0.49687957763671875, -0.47613525390625, -0.45539093017578125, -0.4346466064453125, -0.41390228271484375, -0.393157958984375, -0.37241363525390625, -0.3516693115234375, -0.33092498779296875, -0.3101806640625, -0.28943634033203125, -0.2686920166015625, -0.24794769287109375, -0.227203369140625, -0.20645904541015625, -0.1857147216796875, -0.16497039794921875, -0.14422607421875, -0.12348175048828125, -0.1027374267578125, -0.08199310302734375, -0.061248779296875, -0.04050445556640625, -0.0197601318359375, 0.00098419189453125, 0.021728515625, 0.04247283935546875, 0.0632171630859375, 0.08396148681640625, 0.104705810546875, 0.12545013427734375, 0.1461944580078125, 0.16693878173828125, 0.18768310546875, 0.20842742919921875, 0.2291717529296875, 0.24991607666015625, 0.270660400390625, 0.29140472412109375, 0.3121490478515625, 0.33289337158203125, 0.3536376953125, 0.37438201904296875, 0.3951263427734375, 0.41587066650390625, 0.436614990234375, 0.45735931396484375, 0.4781036376953125, 0.49884796142578125, 0.51959228515625, 0.5403366088867188, 0.5610809326171875, 0.5818252563476562, 0.602569580078125, 0.6233139038085938, 0.6440582275390625, 0.6648025512695312, 0.685546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 8.0, 5.0, 4.0, 9.0, 14.0, 11.0, 16.0, 22.0, 45.0, 49.0, 60.0, 67.0, 70.0, 78.0, 67.0, 73.0, 77.0, 61.0, 60.0, 42.0, 39.0, 34.0, 16.0, 12.0, 22.0, 11.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.20296669006347656, -0.19560623168945312, -0.1882457733154297, -0.18088531494140625, -0.1735248565673828, -0.16616439819335938, -0.15880393981933594, -0.1514434814453125, -0.14408302307128906, -0.13672256469726562, -0.1293621063232422, -0.12200164794921875, -0.11464118957519531, -0.10728073120117188, -0.09992027282714844, -0.092559814453125, -0.08519935607910156, -0.07783889770507812, -0.07047843933105469, -0.06311798095703125, -0.05575752258300781, -0.048397064208984375, -0.04103660583496094, -0.0336761474609375, -0.026315689086914062, -0.018955230712890625, -0.011594772338867188, -0.00423431396484375, 0.0031261444091796875, 0.010486602783203125, 0.017847061157226562, 0.02520751953125, 0.03256797790527344, 0.039928436279296875, 0.04728889465332031, 0.05464935302734375, 0.06200981140136719, 0.06937026977539062, 0.07673072814941406, 0.0840911865234375, 0.09145164489746094, 0.09881210327148438, 0.10617256164550781, 0.11353302001953125, 0.12089347839355469, 0.12825393676757812, 0.13561439514160156, 0.142974853515625, 0.15033531188964844, 0.15769577026367188, 0.1650562286376953, 0.17241668701171875, 0.1797771453857422, 0.18713760375976562, 0.19449806213378906, 0.2018585205078125, 0.20921897888183594, 0.21657943725585938, 0.2239398956298828, 0.23130035400390625, 0.2386608123779297, 0.24602127075195312, 0.25338172912597656, 0.2607421875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 11.0, 9.0, 15.0, 18.0, 24.0, 25.0, 27.0, 38.0, 34.0, 39.0, 49.0, 44.0, 60.0, 56.0, 52.0, 41.0, 56.0, 49.0, 61.0, 39.0, 37.0, 37.0, 30.0, 33.0, 18.0, 5.0, 19.0, 18.0, 7.0, 4.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7627434730529785, -6.54760217666626, -6.332461357116699, -6.1173200607299805, -5.90217924118042, -5.687037944793701, -5.471897125244141, -5.256755828857422, -5.041614532470703, -4.826473236083984, -4.611332416534424, -4.396191120147705, -4.1810503005981445, -3.965909004211426, -3.750767946243286, -3.5356268882751465, -3.320485830307007, -3.105344772338867, -2.8902037143707275, -2.675062656402588, -2.459921360015869, -2.2447803020477295, -2.02963924407959, -1.8144980669021606, -1.599357008934021, -1.3842159509658813, -1.1690747737884521, -0.9539337158203125, -0.7387925982475281, -0.5236514806747437, -0.308510422706604, -0.0933692455291748, 0.12177181243896484, 0.33691293001174927, 0.5520540475845337, 0.7671951055526733, 0.9823362231254578, 1.1974773406982422, 1.4126183986663818, 1.627759575843811, 1.8429006338119507, 2.05804181098938, 2.2731828689575195, 2.488323926925659, 2.703464984893799, 2.9186062812805176, 3.133747100830078, 3.348888397216797, 3.5640294551849365, 3.779170513153076, 3.994311571121216, 4.2094526290893555, 4.424593925476074, 4.639735221862793, 4.8548760414123535, 5.070017337799072, 5.285158157348633, 5.500299453735352, 5.715440273284912, 5.930581569671631, 6.145722389221191, 6.36086368560791, 6.576004981994629, 6.7911458015441895, 7.006287097930908]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 0.0, 3.0, 3.0, 7.0, 3.0, 10.0, 7.0, 9.0, 7.0, 20.0, 14.0, 25.0, 19.0, 30.0, 21.0, 24.0, 38.0, 30.0, 38.0, 33.0, 37.0, 43.0, 40.0, 43.0, 44.0, 34.0, 33.0, 40.0, 39.0, 28.0, 29.0, 31.0, 25.0, 31.0, 23.0, 22.0, 17.0, 11.0, 20.0, 11.0, 11.0, 8.0, 9.0, 10.0, 6.0, 8.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.825692653656006, -4.654580593109131, -4.483469009399414, -4.312356948852539, -4.141245365142822, -3.9701333045959473, -3.7990214824676514, -3.6279096603393555, -3.4567978382110596, -3.2856860160827637, -3.1145741939544678, -2.943462371826172, -2.772350311279297, -2.60123872756958, -2.430126667022705, -2.259014844894409, -2.0879030227661133, -1.9167912006378174, -1.7456793785095215, -1.574567437171936, -1.4034556150436401, -1.2323437929153442, -1.0612318515777588, -0.8901200294494629, -0.719008207321167, -0.5478963851928711, -0.3767845034599304, -0.20567262172698975, -0.03456079959869385, 0.13655102252960205, 0.3076629638671875, 0.4787747859954834, 0.6498870849609375, 0.8209989070892334, 0.9921107888221741, 1.1632226705551147, 1.3343344926834106, 1.5054463148117065, 1.676558256149292, 1.847670078277588, 2.018781900405884, 2.1898937225341797, 2.3610055446624756, 2.5321173667907715, 2.7032294273376465, 2.8743410110473633, 3.0454530715942383, 3.216564893722534, 3.38767671585083, 3.558788537979126, 3.729900360107422, 3.901012420654297, 4.072124004364014, 4.243236064910889, 4.4143476486206055, 4.5854597091674805, 4.7565717697143555, 4.9276838302612305, 5.098795413970947, 5.269907474517822, 5.441019058227539, 5.612131118774414, 5.783243179321289, 5.954354763031006, 6.125466346740723]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 5.0, 6.0, 22.0, 30.0, 60.0, 80.0, 129.0, 181.0, 325.0, 507.0, 777.0, 1347.0, 2356.0, 3833.0, 6501.0, 11486.0, 20090.0, 35180.0, 60898.0, 98519.0, 141655.0, 169918.0, 163930.0, 127172.0, 84614.0, 51065.0, 28603.0, 16359.0, 9400.0, 5385.0, 3230.0, 1790.0, 1164.0, 691.0, 455.0, 262.0, 162.0, 115.0, 81.0, 54.0, 34.0, 25.0, 10.0, 16.0, 10.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.61114501953125, -5.4019775390625, -5.19281005859375, -4.983642578125, -4.77447509765625, -4.5653076171875, -4.35614013671875, -4.14697265625, -3.93780517578125, -3.7286376953125, -3.51947021484375, -3.310302734375, -3.10113525390625, -2.8919677734375, -2.68280029296875, -2.4736328125, -2.26446533203125, -2.0552978515625, -1.84613037109375, -1.636962890625, -1.42779541015625, -1.2186279296875, -1.00946044921875, -0.80029296875, -0.59112548828125, -0.3819580078125, -0.17279052734375, 0.036376953125, 0.24554443359375, 0.4547119140625, 0.66387939453125, 0.873046875, 1.08221435546875, 1.2913818359375, 1.50054931640625, 1.709716796875, 1.91888427734375, 2.1280517578125, 2.33721923828125, 2.54638671875, 2.75555419921875, 2.9647216796875, 3.17388916015625, 3.383056640625, 3.59222412109375, 3.8013916015625, 4.01055908203125, 4.2197265625, 4.42889404296875, 4.6380615234375, 4.84722900390625, 5.056396484375, 5.26556396484375, 5.4747314453125, 5.68389892578125, 5.89306640625, 6.10223388671875, 6.3114013671875, 6.52056884765625, 6.729736328125, 6.93890380859375, 7.1480712890625, 7.35723876953125, 7.56640625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 3.0, 9.0, 11.0, 10.0, 11.0, 20.0, 22.0, 20.0, 27.0, 28.0, 23.0, 23.0, 47.0, 14.0, 45.0, 42.0, 42.0, 44.0, 41.0, 43.0, 34.0, 39.0, 46.0, 39.0, 34.0, 30.0, 24.0, 27.0, 27.0, 26.0, 18.0, 16.0, 16.0, 13.0, 11.0, 12.0, 14.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.67071533203125, -4.4976806640625, -4.32464599609375, -4.151611328125, -3.97857666015625, -3.8055419921875, -3.63250732421875, -3.45947265625, -3.28643798828125, -3.1134033203125, -2.94036865234375, -2.767333984375, -2.59429931640625, -2.4212646484375, -2.24822998046875, -2.0751953125, -1.90216064453125, -1.7291259765625, -1.55609130859375, -1.383056640625, -1.21002197265625, -1.0369873046875, -0.86395263671875, -0.69091796875, -0.51788330078125, -0.3448486328125, -0.17181396484375, 0.001220703125, 0.17425537109375, 0.3472900390625, 0.52032470703125, 0.693359375, 0.86639404296875, 1.0394287109375, 1.21246337890625, 1.385498046875, 1.55853271484375, 1.7315673828125, 1.90460205078125, 2.07763671875, 2.25067138671875, 2.4237060546875, 2.59674072265625, 2.769775390625, 2.94281005859375, 3.1158447265625, 3.28887939453125, 3.4619140625, 3.63494873046875, 3.8079833984375, 3.98101806640625, 4.154052734375, 4.32708740234375, 4.5001220703125, 4.67315673828125, 4.84619140625, 5.01922607421875, 5.1922607421875, 5.36529541015625, 5.538330078125, 5.71136474609375, 5.8843994140625, 6.05743408203125, 6.23046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 13.0, 13.0, 23.0, 49.0, 64.0, 112.0, 168.0, 262.0, 422.0, 672.0, 1012.0, 1790.0, 2916.0, 4595.0, 7946.0, 13306.0, 22882.0, 38296.0, 61231.0, 94727.0, 130475.0, 155605.0, 153773.0, 125569.0, 88642.0, 56973.0, 35119.0, 20934.0, 12304.0, 7434.0, 4431.0, 2669.0, 1528.0, 990.0, 588.0, 358.0, 230.0, 146.0, 100.0, 64.0, 43.0, 23.0, 18.0, 12.0, 10.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.63671875, -6.43511962890625, -6.2335205078125, -6.03192138671875, -5.830322265625, -5.62872314453125, -5.4271240234375, -5.22552490234375, -5.02392578125, -4.82232666015625, -4.6207275390625, -4.41912841796875, -4.217529296875, -4.01593017578125, -3.8143310546875, -3.61273193359375, -3.4111328125, -3.20953369140625, -3.0079345703125, -2.80633544921875, -2.604736328125, -2.40313720703125, -2.2015380859375, -1.99993896484375, -1.79833984375, -1.59674072265625, -1.3951416015625, -1.19354248046875, -0.991943359375, -0.79034423828125, -0.5887451171875, -0.38714599609375, -0.185546875, 0.01605224609375, 0.2176513671875, 0.41925048828125, 0.620849609375, 0.82244873046875, 1.0240478515625, 1.22564697265625, 1.42724609375, 1.62884521484375, 1.8304443359375, 2.03204345703125, 2.233642578125, 2.43524169921875, 2.6368408203125, 2.83843994140625, 3.0400390625, 3.24163818359375, 3.4432373046875, 3.64483642578125, 3.846435546875, 4.04803466796875, 4.2496337890625, 4.45123291015625, 4.65283203125, 4.85443115234375, 5.0560302734375, 5.25762939453125, 5.459228515625, 5.66082763671875, 5.8624267578125, 6.06402587890625, 6.265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 9.0, 4.0, 11.0, 12.0, 12.0, 14.0, 19.0, 20.0, 18.0, 14.0, 26.0, 28.0, 33.0, 32.0, 27.0, 26.0, 38.0, 35.0, 37.0, 50.0, 39.0, 38.0, 40.0, 41.0, 46.0, 31.0, 46.0, 31.0, 34.0, 18.0, 22.0, 21.0, 23.0, 16.0, 19.0, 13.0, 8.0, 13.0, 8.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.607421875, -3.497039794921875, -3.38665771484375, -3.276275634765625, -3.1658935546875, -3.055511474609375, -2.94512939453125, -2.834747314453125, -2.724365234375, -2.613983154296875, -2.50360107421875, -2.393218994140625, -2.2828369140625, -2.172454833984375, -2.06207275390625, -1.951690673828125, -1.84130859375, -1.730926513671875, -1.62054443359375, -1.510162353515625, -1.3997802734375, -1.289398193359375, -1.17901611328125, -1.068634033203125, -0.958251953125, -0.847869873046875, -0.73748779296875, -0.627105712890625, -0.5167236328125, -0.406341552734375, -0.29595947265625, -0.185577392578125, -0.0751953125, 0.035186767578125, 0.14556884765625, 0.255950927734375, 0.3663330078125, 0.476715087890625, 0.58709716796875, 0.697479248046875, 0.807861328125, 0.918243408203125, 1.02862548828125, 1.139007568359375, 1.2493896484375, 1.359771728515625, 1.47015380859375, 1.580535888671875, 1.69091796875, 1.801300048828125, 1.91168212890625, 2.022064208984375, 2.1324462890625, 2.242828369140625, 2.35321044921875, 2.463592529296875, 2.573974609375, 2.684356689453125, 2.79473876953125, 2.905120849609375, 3.0155029296875, 3.125885009765625, 3.23626708984375, 3.346649169921875, 3.45703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 3.0, 4.0, 7.0, 15.0, 28.0, 34.0, 66.0, 87.0, 166.0, 217.0, 397.0, 701.0, 1162.0, 2069.0, 3566.0, 7099.0, 13867.0, 28636.0, 60307.0, 124743.0, 214307.0, 244968.0, 172428.0, 89202.0, 42487.0, 20170.0, 10104.0, 5199.0, 2756.0, 1499.0, 915.0, 520.0, 326.0, 166.0, 128.0, 73.0, 61.0, 23.0, 14.0, 15.0, 6.0, 9.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.546844482421875, -4.41790771484375, -4.288970947265625, -4.1600341796875, -4.031097412109375, -3.90216064453125, -3.773223876953125, -3.644287109375, -3.515350341796875, -3.38641357421875, -3.257476806640625, -3.1285400390625, -2.999603271484375, -2.87066650390625, -2.741729736328125, -2.61279296875, -2.483856201171875, -2.35491943359375, -2.225982666015625, -2.0970458984375, -1.968109130859375, -1.83917236328125, -1.710235595703125, -1.581298828125, -1.452362060546875, -1.32342529296875, -1.194488525390625, -1.0655517578125, -0.936614990234375, -0.80767822265625, -0.678741455078125, -0.5498046875, -0.420867919921875, -0.29193115234375, -0.162994384765625, -0.0340576171875, 0.094879150390625, 0.22381591796875, 0.352752685546875, 0.481689453125, 0.610626220703125, 0.73956298828125, 0.868499755859375, 0.9974365234375, 1.126373291015625, 1.25531005859375, 1.384246826171875, 1.51318359375, 1.642120361328125, 1.77105712890625, 1.899993896484375, 2.0289306640625, 2.157867431640625, 2.28680419921875, 2.415740966796875, 2.544677734375, 2.673614501953125, 2.80255126953125, 2.931488037109375, 3.0604248046875, 3.189361572265625, 3.31829833984375, 3.447235107421875, 3.576171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 22.0, 15.0, 20.0, 21.0, 30.0, 24.0, 45.0, 43.0, 58.0, 56.0, 64.0, 66.0, 57.0, 69.0, 71.0, 50.0, 49.0, 43.0, 30.0, 34.0, 22.0, 16.0, 10.0, 8.0, 11.0, 5.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0003609657287597656, -0.00035040080547332764, -0.00033983588218688965, -0.00032927095890045166, -0.00031870603561401367, -0.0003081411123275757, -0.0002975761890411377, -0.0002870112657546997, -0.0002764463424682617, -0.00026588141918182373, -0.00025531649589538574, -0.00024475157260894775, -0.00023418664932250977, -0.00022362172603607178, -0.0002130568027496338, -0.0002024918794631958, -0.0001919269561767578, -0.00018136203289031982, -0.00017079710960388184, -0.00016023218631744385, -0.00014966726303100586, -0.00013910233974456787, -0.00012853741645812988, -0.0001179724931716919, -0.0001074075698852539, -9.684264659881592e-05, -8.627772331237793e-05, -7.571280002593994e-05, -6.514787673950195e-05, -5.4582953453063965e-05, -4.4018030166625977e-05, -3.345310688018799e-05, -2.288818359375e-05, -1.2323260307312012e-05, -1.7583370208740234e-06, 8.806586265563965e-06, 1.9371509552001953e-05, 2.993643283843994e-05, 4.050135612487793e-05, 5.106627941131592e-05, 6.16312026977539e-05, 7.21961259841919e-05, 8.276104927062988e-05, 9.332597255706787e-05, 0.00010389089584350586, 0.00011445581912994385, 0.00012502074241638184, 0.00013558566570281982, 0.0001461505889892578, 0.0001567155122756958, 0.0001672804355621338, 0.00017784535884857178, 0.00018841028213500977, 0.00019897520542144775, 0.00020954012870788574, 0.00022010505199432373, 0.00023066997528076172, 0.0002412348985671997, 0.0002517998218536377, 0.0002623647451400757, 0.00027292966842651367, 0.00028349459171295166, 0.00029405951499938965, 0.00030462443828582764, 0.0003151893615722656]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 4.0, 10.0, 14.0, 13.0, 20.0, 34.0, 48.0, 64.0, 101.0, 129.0, 237.0, 310.0, 447.0, 697.0, 1030.0, 1621.0, 2525.0, 3793.0, 6311.0, 10295.0, 16696.0, 27692.0, 47013.0, 75466.0, 113004.0, 148562.0, 161881.0, 143823.0, 106812.0, 69863.0, 43042.0, 25895.0, 15444.0, 9458.0, 5704.0, 3683.0, 2281.0, 1506.0, 958.0, 624.0, 396.0, 321.0, 215.0, 145.0, 147.0, 68.0, 49.0, 27.0, 21.0, 20.0, 12.0, 14.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.5625, -2.48345947265625, -2.4044189453125, -2.32537841796875, -2.246337890625, -2.16729736328125, -2.0882568359375, -2.00921630859375, -1.93017578125, -1.85113525390625, -1.7720947265625, -1.69305419921875, -1.614013671875, -1.53497314453125, -1.4559326171875, -1.37689208984375, -1.2978515625, -1.21881103515625, -1.1397705078125, -1.06072998046875, -0.981689453125, -0.90264892578125, -0.8236083984375, -0.74456787109375, -0.66552734375, -0.58648681640625, -0.5074462890625, -0.42840576171875, -0.349365234375, -0.27032470703125, -0.1912841796875, -0.11224365234375, -0.033203125, 0.04583740234375, 0.1248779296875, 0.20391845703125, 0.282958984375, 0.36199951171875, 0.4410400390625, 0.52008056640625, 0.59912109375, 0.67816162109375, 0.7572021484375, 0.83624267578125, 0.915283203125, 0.99432373046875, 1.0733642578125, 1.15240478515625, 1.2314453125, 1.31048583984375, 1.3895263671875, 1.46856689453125, 1.547607421875, 1.62664794921875, 1.7056884765625, 1.78472900390625, 1.86376953125, 1.94281005859375, 2.0218505859375, 2.10089111328125, 2.179931640625, 2.25897216796875, 2.3380126953125, 2.41705322265625, 2.49609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 8.0, 7.0, 9.0, 18.0, 24.0, 27.0, 30.0, 41.0, 44.0, 47.0, 49.0, 64.0, 55.0, 47.0, 51.0, 53.0, 51.0, 37.0, 45.0, 34.0, 37.0, 41.0, 37.0, 28.0, 19.0, 11.0, 16.0, 9.0, 7.0, 7.0, 9.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.267578125, -1.23333740234375, -1.1990966796875, -1.16485595703125, -1.130615234375, -1.09637451171875, -1.0621337890625, -1.02789306640625, -0.99365234375, -0.95941162109375, -0.9251708984375, -0.89093017578125, -0.856689453125, -0.82244873046875, -0.7882080078125, -0.75396728515625, -0.7197265625, -0.68548583984375, -0.6512451171875, -0.61700439453125, -0.582763671875, -0.54852294921875, -0.5142822265625, -0.48004150390625, -0.44580078125, -0.41156005859375, -0.3773193359375, -0.34307861328125, -0.308837890625, -0.27459716796875, -0.2403564453125, -0.20611572265625, -0.171875, -0.13763427734375, -0.1033935546875, -0.06915283203125, -0.034912109375, -0.00067138671875, 0.0335693359375, 0.06781005859375, 0.10205078125, 0.13629150390625, 0.1705322265625, 0.20477294921875, 0.239013671875, 0.27325439453125, 0.3074951171875, 0.34173583984375, 0.3759765625, 0.41021728515625, 0.4444580078125, 0.47869873046875, 0.512939453125, 0.54718017578125, 0.5814208984375, 0.61566162109375, 0.64990234375, 0.68414306640625, 0.7183837890625, 0.75262451171875, 0.786865234375, 0.82110595703125, 0.8553466796875, 0.88958740234375, 0.923828125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 9.0, 7.0, 8.0, 6.0, 18.0, 21.0, 18.0, 33.0, 36.0, 42.0, 39.0, 53.0, 41.0, 67.0, 48.0, 60.0, 65.0, 58.0, 49.0, 44.0, 52.0, 48.0, 27.0, 30.0, 26.0, 19.0, 21.0, 18.0, 9.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.047542572021484, -7.808728218078613, -7.569913864135742, -7.331099510192871, -7.09228515625, -6.853470802307129, -6.614656448364258, -6.375842094421387, -6.137027740478516, -5.8982133865356445, -5.659399032592773, -5.420584678649902, -5.181770324707031, -4.94295597076416, -4.704141616821289, -4.465327262878418, -4.226512908935547, -3.987698554992676, -3.7488842010498047, -3.5100698471069336, -3.2712554931640625, -3.0324411392211914, -2.7936267852783203, -2.554812431335449, -2.315998077392578, -2.077183723449707, -1.838369369506836, -1.5995550155639648, -1.3607406616210938, -1.1219263076782227, -0.8831119537353516, -0.6442975997924805, -0.4054832458496094, -0.16666889190673828, 0.07214546203613281, 0.3109598159790039, 0.549774169921875, 0.7885885238647461, 1.0274028778076172, 1.2662172317504883, 1.5050315856933594, 1.7438459396362305, 1.9826602935791016, 2.2214746475219727, 2.4602890014648438, 2.699103355407715, 2.937917709350586, 3.176732063293457, 3.415546417236328, 3.654360771179199, 3.8931751251220703, 4.131989479064941, 4.3708038330078125, 4.609618186950684, 4.848432540893555, 5.087246894836426, 5.326061248779297, 5.564875602722168, 5.803689956665039, 6.04250431060791, 6.281318664550781, 6.520133018493652, 6.758947372436523, 6.9977617263793945, 7.236576080322266]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 7.0, 16.0, 16.0, 12.0, 14.0, 10.0, 21.0, 25.0, 37.0, 37.0, 38.0, 41.0, 29.0, 33.0, 33.0, 40.0, 41.0, 52.0, 34.0, 45.0, 38.0, 30.0, 39.0, 39.0, 27.0, 35.0, 25.0, 26.0, 19.0, 26.0, 21.0, 18.0, 16.0, 10.0, 6.0, 5.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.926061630249023, -5.739451885223389, -5.552842617034912, -5.366232872009277, -5.179623603820801, -4.993013858795166, -4.806404113769531, -4.619794845581055, -4.433185577392578, -4.246575832366943, -4.059966564178467, -3.873356819152832, -3.6867475509643555, -3.5001378059387207, -3.313528299331665, -3.1269187927246094, -2.9403090476989746, -2.753699541091919, -2.5670900344848633, -2.3804802894592285, -2.193871021270752, -2.007261276245117, -1.8206517696380615, -1.6340422630310059, -1.4474327564239502, -1.2608232498168945, -1.0742137432098389, -0.8876041173934937, -0.700994610786438, -0.5143851041793823, -0.3277754783630371, -0.14116597175598145, 0.04544353485107422, 0.23205307126045227, 0.4186626076698303, 0.6052721738815308, 0.7918816804885864, 0.9784911870956421, 1.1651008129119873, 1.351710319519043, 1.5383198261260986, 1.7249293327331543, 1.91153883934021, 2.0981483459472656, 2.2847580909729004, 2.471367359161377, 2.6579771041870117, 2.8445866107940674, 3.031196117401123, 3.2178056240081787, 3.4044151306152344, 3.591024875640869, 3.7776341438293457, 3.9642438888549805, 4.150853157043457, 4.337462902069092, 4.524072647094727, 4.710682392120361, 4.897291660308838, 5.083901405334473, 5.270510673522949, 5.457120418548584, 5.643730163574219, 5.830339431762695, 6.016948699951172]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 6.0, 7.0, 14.0, 23.0, 35.0, 64.0, 93.0, 129.0, 223.0, 348.0, 636.0, 1002.0, 1606.0, 2825.0, 4781.0, 8673.0, 16097.0, 30409.0, 60219.0, 122671.0, 251800.0, 486196.0, 769200.0, 887084.0, 709974.0, 420109.0, 211679.0, 100980.0, 50639.0, 25327.0, 13575.0, 7632.0, 4248.0, 2406.0, 1444.0, 845.0, 522.0, 289.0, 173.0, 122.0, 62.0, 49.0, 23.0, 13.0, 12.0, 11.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.203125, -6.01727294921875, -5.8314208984375, -5.64556884765625, -5.459716796875, -5.27386474609375, -5.0880126953125, -4.90216064453125, -4.71630859375, -4.53045654296875, -4.3446044921875, -4.15875244140625, -3.972900390625, -3.78704833984375, -3.6011962890625, -3.41534423828125, -3.2294921875, -3.04364013671875, -2.8577880859375, -2.67193603515625, -2.486083984375, -2.30023193359375, -2.1143798828125, -1.92852783203125, -1.74267578125, -1.55682373046875, -1.3709716796875, -1.18511962890625, -0.999267578125, -0.81341552734375, -0.6275634765625, -0.44171142578125, -0.255859375, -0.07000732421875, 0.1158447265625, 0.30169677734375, 0.487548828125, 0.67340087890625, 0.8592529296875, 1.04510498046875, 1.23095703125, 1.41680908203125, 1.6026611328125, 1.78851318359375, 1.974365234375, 2.16021728515625, 2.3460693359375, 2.53192138671875, 2.7177734375, 2.90362548828125, 3.0894775390625, 3.27532958984375, 3.461181640625, 3.64703369140625, 3.8328857421875, 4.01873779296875, 4.20458984375, 4.39044189453125, 4.5762939453125, 4.76214599609375, 4.947998046875, 5.13385009765625, 5.3197021484375, 5.50555419921875, 5.69140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 10.0, 8.0, 12.0, 21.0, 18.0, 24.0, 18.0, 30.0, 29.0, 22.0, 25.0, 37.0, 36.0, 42.0, 34.0, 33.0, 25.0, 47.0, 41.0, 42.0, 52.0, 44.0, 24.0, 32.0, 24.0, 32.0, 31.0, 35.0, 32.0, 16.0, 15.0, 16.0, 19.0, 11.0, 9.0, 6.0, 6.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.41796875, -4.26251220703125, -4.1070556640625, -3.95159912109375, -3.796142578125, -3.64068603515625, -3.4852294921875, -3.32977294921875, -3.17431640625, -3.01885986328125, -2.8634033203125, -2.70794677734375, -2.552490234375, -2.39703369140625, -2.2415771484375, -2.08612060546875, -1.9306640625, -1.77520751953125, -1.6197509765625, -1.46429443359375, -1.308837890625, -1.15338134765625, -0.9979248046875, -0.84246826171875, -0.68701171875, -0.53155517578125, -0.3760986328125, -0.22064208984375, -0.065185546875, 0.09027099609375, 0.2457275390625, 0.40118408203125, 0.556640625, 0.71209716796875, 0.8675537109375, 1.02301025390625, 1.178466796875, 1.33392333984375, 1.4893798828125, 1.64483642578125, 1.80029296875, 1.95574951171875, 2.1112060546875, 2.26666259765625, 2.422119140625, 2.57757568359375, 2.7330322265625, 2.88848876953125, 3.0439453125, 3.19940185546875, 3.3548583984375, 3.51031494140625, 3.665771484375, 3.82122802734375, 3.9766845703125, 4.13214111328125, 4.28759765625, 4.44305419921875, 4.5985107421875, 4.75396728515625, 4.909423828125, 5.06488037109375, 5.2203369140625, 5.37579345703125, 5.53125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 14.0, 21.0, 27.0, 41.0, 43.0, 86.0, 125.0, 176.0, 258.0, 471.0, 687.0, 1102.0, 1791.0, 2963.0, 4944.0, 8501.0, 14715.0, 26105.0, 46722.0, 85330.0, 153324.0, 273329.0, 451929.0, 658993.0, 762387.0, 653395.0, 442733.0, 265007.0, 149780.0, 83078.0, 45242.0, 25659.0, 14373.0, 8317.0, 4835.0, 2956.0, 1775.0, 1080.0, 705.0, 438.0, 251.0, 212.0, 120.0, 84.0, 49.0, 32.0, 28.0, 16.0, 19.0, 4.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0], "bins": [-6.23828125, -6.04620361328125, -5.8541259765625, -5.66204833984375, -5.469970703125, -5.27789306640625, -5.0858154296875, -4.89373779296875, -4.70166015625, -4.50958251953125, -4.3175048828125, -4.12542724609375, -3.933349609375, -3.74127197265625, -3.5491943359375, -3.35711669921875, -3.1650390625, -2.97296142578125, -2.7808837890625, -2.58880615234375, -2.396728515625, -2.20465087890625, -2.0125732421875, -1.82049560546875, -1.62841796875, -1.43634033203125, -1.2442626953125, -1.05218505859375, -0.860107421875, -0.66802978515625, -0.4759521484375, -0.28387451171875, -0.091796875, 0.10028076171875, 0.2923583984375, 0.48443603515625, 0.676513671875, 0.86859130859375, 1.0606689453125, 1.25274658203125, 1.44482421875, 1.63690185546875, 1.8289794921875, 2.02105712890625, 2.213134765625, 2.40521240234375, 2.5972900390625, 2.78936767578125, 2.9814453125, 3.17352294921875, 3.3656005859375, 3.55767822265625, 3.749755859375, 3.94183349609375, 4.1339111328125, 4.32598876953125, 4.51806640625, 4.71014404296875, 4.9022216796875, 5.09429931640625, 5.286376953125, 5.47845458984375, 5.6705322265625, 5.86260986328125, 6.0546875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 5.0, 3.0, 5.0, 8.0, 3.0, 7.0, 12.0, 18.0, 17.0, 18.0, 25.0, 41.0, 43.0, 48.0, 74.0, 76.0, 100.0, 102.0, 108.0, 135.0, 146.0, 181.0, 175.0, 237.0, 213.0, 186.0, 181.0, 236.0, 203.0, 170.0, 174.0, 176.0, 140.0, 108.0, 110.0, 82.0, 88.0, 72.0, 64.0, 56.0, 51.0, 35.0, 40.0, 21.0, 25.0, 12.0, 10.0, 2.0, 13.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.013671875, -1.95074462890625, -1.8878173828125, -1.82489013671875, -1.761962890625, -1.69903564453125, -1.6361083984375, -1.57318115234375, -1.51025390625, -1.44732666015625, -1.3843994140625, -1.32147216796875, -1.258544921875, -1.19561767578125, -1.1326904296875, -1.06976318359375, -1.0068359375, -0.94390869140625, -0.8809814453125, -0.81805419921875, -0.755126953125, -0.69219970703125, -0.6292724609375, -0.56634521484375, -0.50341796875, -0.44049072265625, -0.3775634765625, -0.31463623046875, -0.251708984375, -0.18878173828125, -0.1258544921875, -0.06292724609375, 0.0, 0.06292724609375, 0.1258544921875, 0.18878173828125, 0.251708984375, 0.31463623046875, 0.3775634765625, 0.44049072265625, 0.50341796875, 0.56634521484375, 0.6292724609375, 0.69219970703125, 0.755126953125, 0.81805419921875, 0.8809814453125, 0.94390869140625, 1.0068359375, 1.06976318359375, 1.1326904296875, 1.19561767578125, 1.258544921875, 1.32147216796875, 1.3843994140625, 1.44732666015625, 1.51025390625, 1.57318115234375, 1.6361083984375, 1.69903564453125, 1.761962890625, 1.82489013671875, 1.8878173828125, 1.95074462890625, 2.013671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 10.0, 6.0, 5.0, 12.0, 9.0, 16.0, 22.0, 26.0, 30.0, 22.0, 40.0, 45.0, 44.0, 43.0, 71.0, 54.0, 52.0, 47.0, 52.0, 56.0, 41.0, 49.0, 42.0, 39.0, 29.0, 22.0, 20.0, 17.0, 17.0, 11.0, 15.0, 8.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.131368637084961, -6.9155449867248535, -6.699721336364746, -6.483897686004639, -6.268074035644531, -6.052250385284424, -5.836426734924316, -5.620603561401367, -5.404779434204102, -5.188955783843994, -4.973132133483887, -4.757308483123779, -4.541484832763672, -4.3256611824035645, -4.109837532043457, -3.8940141201019287, -3.6781907081604004, -3.462367057800293, -3.2465434074401855, -3.030719757080078, -2.8148961067199707, -2.5990724563598633, -2.383249044418335, -2.1674253940582275, -1.9516017436981201, -1.7357780933380127, -1.5199544429779053, -1.3041309118270874, -1.08830726146698, -0.8724836111068726, -0.6566600799560547, -0.44083642959594727, -0.22501277923583984, -0.00918915867805481, 0.20663446187973022, 0.42245805263519287, 0.6382817029953003, 0.8541053533554077, 1.0699288845062256, 1.285752534866333, 1.5015761852264404, 1.7173998355865479, 1.9332234859466553, 2.1490468978881836, 2.364870548248291, 2.5806941986083984, 2.796517848968506, 3.0123414993286133, 3.2281651496887207, 3.443988800048828, 3.6598124504089355, 3.875636100769043, 4.09145975112915, 4.307283401489258, 4.523106575012207, 4.738930702209473, 4.954753875732422, 5.170577526092529, 5.386401176452637, 5.602224826812744, 5.818048477172852, 6.033872127532959, 6.249695777893066, 6.465518951416016, 6.681343078613281]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 6.0, 10.0, 9.0, 5.0, 9.0, 18.0, 17.0, 22.0, 20.0, 37.0, 24.0, 30.0, 37.0, 42.0, 23.0, 24.0, 33.0, 31.0, 40.0, 38.0, 39.0, 46.0, 40.0, 39.0, 38.0, 33.0, 39.0, 31.0, 26.0, 24.0, 25.0, 24.0, 15.0, 23.0, 13.0, 17.0, 8.0, 7.0, 10.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.20350456237793, -5.025732040405273, -4.847959518432617, -4.670186996459961, -4.492414474487305, -4.314641952514648, -4.136869430541992, -3.959097146987915, -3.781324625015259, -3.6035521030426025, -3.4257795810699463, -3.248007297515869, -3.070234775543213, -2.8924622535705566, -2.7146897315979004, -2.536917209625244, -2.359144687652588, -2.1813721656799316, -2.0035996437072754, -1.8258272409439087, -1.6480547189712524, -1.4702821969985962, -1.2925097942352295, -1.1147372722625732, -0.936964750289917, -0.7591922283172607, -0.5814197659492493, -0.4036473035812378, -0.22587478160858154, -0.04810225963592529, 0.1296701431274414, 0.30744266510009766, 0.4852156639099121, 0.6629881858825684, 0.8407606482505798, 1.0185331106185913, 1.1963056325912476, 1.3740781545639038, 1.5518505573272705, 1.7296230792999268, 1.907395601272583, 2.0851681232452393, 2.2629406452178955, 2.4407129287719727, 2.618485450744629, 2.796257972717285, 2.9740304946899414, 3.1518030166625977, 3.329575538635254, 3.50734806060791, 3.6851205825805664, 3.8628931045532227, 4.040665626525879, 4.218438148498535, 4.396210670471191, 4.573983192443848, 4.751755714416504, 4.92952823638916, 5.107300758361816, 5.285073280334473, 5.462845802307129, 5.640618324279785, 5.818390846252441, 5.996163368225098, 6.173935413360596]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 6.0, 7.0, 9.0, 24.0, 28.0, 36.0, 54.0, 84.0, 106.0, 148.0, 247.0, 404.0, 590.0, 936.0, 1548.0, 2496.0, 4046.0, 7127.0, 12189.0, 21078.0, 36420.0, 63249.0, 103072.0, 152784.0, 184099.0, 165673.0, 116954.0, 72803.0, 42795.0, 24626.0, 14063.0, 8176.0, 4758.0, 2981.0, 1807.0, 1137.0, 704.0, 442.0, 299.0, 193.0, 114.0, 72.0, 48.0, 40.0, 31.0, 13.0, 11.0, 11.0, 3.0, 3.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.00677490234375, -1.9412841796875, -1.87579345703125, -1.810302734375, -1.74481201171875, -1.6793212890625, -1.61383056640625, -1.54833984375, -1.48284912109375, -1.4173583984375, -1.35186767578125, -1.286376953125, -1.22088623046875, -1.1553955078125, -1.08990478515625, -1.0244140625, -0.95892333984375, -0.8934326171875, -0.82794189453125, -0.762451171875, -0.69696044921875, -0.6314697265625, -0.56597900390625, -0.50048828125, -0.43499755859375, -0.3695068359375, -0.30401611328125, -0.238525390625, -0.17303466796875, -0.1075439453125, -0.04205322265625, 0.0234375, 0.08892822265625, 0.1544189453125, 0.21990966796875, 0.285400390625, 0.35089111328125, 0.4163818359375, 0.48187255859375, 0.54736328125, 0.61285400390625, 0.6783447265625, 0.74383544921875, 0.809326171875, 0.87481689453125, 0.9403076171875, 1.00579833984375, 1.0712890625, 1.13677978515625, 1.2022705078125, 1.26776123046875, 1.333251953125, 1.39874267578125, 1.4642333984375, 1.52972412109375, 1.59521484375, 1.66070556640625, 1.7261962890625, 1.79168701171875, 1.857177734375, 1.92266845703125, 1.9881591796875, 2.05364990234375, 2.119140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 8.0, 6.0, 8.0, 13.0, 9.0, 18.0, 15.0, 16.0, 28.0, 26.0, 34.0, 34.0, 34.0, 34.0, 34.0, 45.0, 36.0, 33.0, 37.0, 49.0, 41.0, 40.0, 33.0, 39.0, 36.0, 40.0, 38.0, 27.0, 36.0, 27.0, 24.0, 17.0, 22.0, 10.0, 9.0, 10.0, 4.0, 6.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.00390625, -5.8065185546875, -5.609130859375, -5.4117431640625, -5.21435546875, -5.0169677734375, -4.819580078125, -4.6221923828125, -4.4248046875, -4.2274169921875, -4.030029296875, -3.8326416015625, -3.63525390625, -3.4378662109375, -3.240478515625, -3.0430908203125, -2.845703125, -2.6483154296875, -2.450927734375, -2.2535400390625, -2.05615234375, -1.8587646484375, -1.661376953125, -1.4639892578125, -1.2666015625, -1.0692138671875, -0.871826171875, -0.6744384765625, -0.47705078125, -0.2796630859375, -0.082275390625, 0.1151123046875, 0.3125, 0.5098876953125, 0.707275390625, 0.9046630859375, 1.10205078125, 1.2994384765625, 1.496826171875, 1.6942138671875, 1.8916015625, 2.0889892578125, 2.286376953125, 2.4837646484375, 2.68115234375, 2.8785400390625, 3.075927734375, 3.2733154296875, 3.470703125, 3.6680908203125, 3.865478515625, 4.0628662109375, 4.26025390625, 4.4576416015625, 4.655029296875, 4.8524169921875, 5.0498046875, 5.2471923828125, 5.444580078125, 5.6419677734375, 5.83935546875, 6.0367431640625, 6.234130859375, 6.4315185546875, 6.62890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 11.0, 20.0, 18.0, 23.0, 38.0, 66.0, 64.0, 139.0, 235.0, 370.0, 631.0, 1093.0, 2147.0, 4239.0, 8710.0, 18720.0, 50058.0, 835869.0, 81951.0, 22764.0, 10525.0, 5105.0, 2575.0, 1339.0, 702.0, 426.0, 247.0, 163.0, 88.0, 65.0, 38.0, 25.0, 24.0, 17.0, 18.0, 6.0, 7.0, 1.0, 0.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8902587890625, -7.655517578125, -7.4207763671875, -7.18603515625, -6.9512939453125, -6.716552734375, -6.4818115234375, -6.2470703125, -6.0123291015625, -5.777587890625, -5.5428466796875, -5.30810546875, -5.0733642578125, -4.838623046875, -4.6038818359375, -4.369140625, -4.1343994140625, -3.899658203125, -3.6649169921875, -3.43017578125, -3.1954345703125, -2.960693359375, -2.7259521484375, -2.4912109375, -2.2564697265625, -2.021728515625, -1.7869873046875, -1.55224609375, -1.3175048828125, -1.082763671875, -0.8480224609375, -0.61328125, -0.3785400390625, -0.143798828125, 0.0909423828125, 0.32568359375, 0.5604248046875, 0.795166015625, 1.0299072265625, 1.2646484375, 1.4993896484375, 1.734130859375, 1.9688720703125, 2.20361328125, 2.4383544921875, 2.673095703125, 2.9078369140625, 3.142578125, 3.3773193359375, 3.612060546875, 3.8468017578125, 4.08154296875, 4.3162841796875, 4.551025390625, 4.7857666015625, 5.0205078125, 5.2552490234375, 5.489990234375, 5.7247314453125, 5.95947265625, 6.1942138671875, 6.428955078125, 6.6636962890625, 6.8984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 6.0, 9.0, 9.0, 18.0, 15.0, 17.0, 15.0, 18.0, 30.0, 28.0, 33.0, 29.0, 50.0, 36.0, 32.0, 44.0, 48.0, 39.0, 46.0, 41.0, 40.0, 42.0, 40.0, 42.0, 28.0, 34.0, 45.0, 36.0, 30.0, 18.0, 11.0, 9.0, 14.0, 12.0, 7.0, 4.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.546875, -5.38726806640625, -5.2276611328125, -5.06805419921875, -4.908447265625, -4.74884033203125, -4.5892333984375, -4.42962646484375, -4.27001953125, -4.11041259765625, -3.9508056640625, -3.79119873046875, -3.631591796875, -3.47198486328125, -3.3123779296875, -3.15277099609375, -2.9931640625, -2.83355712890625, -2.6739501953125, -2.51434326171875, -2.354736328125, -2.19512939453125, -2.0355224609375, -1.87591552734375, -1.71630859375, -1.55670166015625, -1.3970947265625, -1.23748779296875, -1.077880859375, -0.91827392578125, -0.7586669921875, -0.59906005859375, -0.439453125, -0.27984619140625, -0.1202392578125, 0.03936767578125, 0.198974609375, 0.35858154296875, 0.5181884765625, 0.67779541015625, 0.83740234375, 0.99700927734375, 1.1566162109375, 1.31622314453125, 1.475830078125, 1.63543701171875, 1.7950439453125, 1.95465087890625, 2.1142578125, 2.27386474609375, 2.4334716796875, 2.59307861328125, 2.752685546875, 2.91229248046875, 3.0718994140625, 3.23150634765625, 3.39111328125, 3.55072021484375, 3.7103271484375, 3.86993408203125, 4.029541015625, 4.18914794921875, 4.3487548828125, 4.50836181640625, 4.66796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 10.0, 4.0, 8.0, 17.0, 20.0, 13.0, 27.0, 35.0, 45.0, 53.0, 64.0, 107.0, 127.0, 172.0, 226.0, 306.0, 466.0, 641.0, 904.0, 1258.0, 1925.0, 2916.0, 4540.0, 7198.0, 12316.0, 22399.0, 67877.0, 691966.0, 161860.0, 30573.0, 15067.0, 8782.0, 5463.0, 3611.0, 2305.0, 1485.0, 1027.0, 737.0, 509.0, 388.0, 297.0, 218.0, 158.0, 121.0, 77.0, 55.0, 54.0, 35.0, 25.0, 17.0, 19.0, 11.0, 9.0, 8.0, 7.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.469482421875, -0.4546661376953125, -0.439849853515625, -0.4250335693359375, -0.41021728515625, -0.3954010009765625, -0.380584716796875, -0.3657684326171875, -0.3509521484375, -0.3361358642578125, -0.321319580078125, -0.3065032958984375, -0.29168701171875, -0.2768707275390625, -0.262054443359375, -0.2472381591796875, -0.232421875, -0.2176055908203125, -0.202789306640625, -0.1879730224609375, -0.17315673828125, -0.1583404541015625, -0.143524169921875, -0.1287078857421875, -0.1138916015625, -0.0990753173828125, -0.084259033203125, -0.0694427490234375, -0.05462646484375, -0.0398101806640625, -0.024993896484375, -0.0101776123046875, 0.004638671875, 0.0194549560546875, 0.034271240234375, 0.0490875244140625, 0.06390380859375, 0.0787200927734375, 0.093536376953125, 0.1083526611328125, 0.1231689453125, 0.1379852294921875, 0.152801513671875, 0.1676177978515625, 0.18243408203125, 0.1972503662109375, 0.212066650390625, 0.2268829345703125, 0.24169921875, 0.2565155029296875, 0.271331787109375, 0.2861480712890625, 0.30096435546875, 0.3157806396484375, 0.330596923828125, 0.3454132080078125, 0.3602294921875, 0.3750457763671875, 0.389862060546875, 0.4046783447265625, 0.41949462890625, 0.4343109130859375, 0.449127197265625, 0.4639434814453125, 0.478759765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 11.0, 14.0, 16.0, 21.0, 23.0, 30.0, 32.0, 42.0, 51.0, 56.0, 61.0, 76.0, 70.0, 61.0, 59.0, 61.0, 53.0, 44.0, 35.0, 35.0, 26.0, 27.0, 17.0, 12.0, 9.0, 4.0, 9.0, 5.0, 8.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8100948333740234e-05, -4.625041037797928e-05, -4.439987242221832e-05, -4.254933446645737e-05, -4.069879651069641e-05, -3.8848258554935455e-05, -3.69977205991745e-05, -3.5147182643413544e-05, -3.329664468765259e-05, -3.144610673189163e-05, -2.9595568776130676e-05, -2.774503082036972e-05, -2.5894492864608765e-05, -2.404395490884781e-05, -2.2193416953086853e-05, -2.0342878997325897e-05, -1.849234104156494e-05, -1.6641803085803986e-05, -1.479126513004303e-05, -1.2940727174282074e-05, -1.1090189218521118e-05, -9.239651262760162e-06, -7.3891133069992065e-06, -5.538575351238251e-06, -3.688037395477295e-06, -1.8374994397163391e-06, 1.30385160446167e-08, 1.8635764718055725e-06, 3.7141144275665283e-06, 5.564652383327484e-06, 7.41519033908844e-06, 9.265728294849396e-06, 1.1116266250610352e-05, 1.2966804206371307e-05, 1.4817342162132263e-05, 1.666788011789322e-05, 1.8518418073654175e-05, 2.036895602941513e-05, 2.2219493985176086e-05, 2.4070031940937042e-05, 2.5920569896697998e-05, 2.7771107852458954e-05, 2.962164580821991e-05, 3.1472183763980865e-05, 3.332272171974182e-05, 3.517325967550278e-05, 3.702379763126373e-05, 3.887433558702469e-05, 4.0724873542785645e-05, 4.25754114985466e-05, 4.4425949454307556e-05, 4.627648741006851e-05, 4.812702536582947e-05, 4.9977563321590424e-05, 5.182810127735138e-05, 5.3678639233112335e-05, 5.552917718887329e-05, 5.737971514463425e-05, 5.92302531003952e-05, 6.108079105615616e-05, 6.293132901191711e-05, 6.478186696767807e-05, 6.663240492343903e-05, 6.848294287919998e-05, 7.033348083496094e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 9.0, 3.0, 9.0, 15.0, 32.0, 50.0, 73.0, 86.0, 139.0, 188.0, 255.0, 342.0, 616.0, 808.0, 1248.0, 2043.0, 3084.0, 4999.0, 8940.0, 17169.0, 35413.0, 75173.0, 146737.0, 224822.0, 225056.0, 148087.0, 76173.0, 36333.0, 17346.0, 9218.0, 5082.0, 3086.0, 1964.0, 1323.0, 866.0, 561.0, 391.0, 242.0, 175.0, 144.0, 100.0, 61.0, 29.0, 21.0, 21.0, 10.0, 12.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4609184265136719, -0.44503021240234375, -0.4291419982910156, -0.4132537841796875, -0.3973655700683594, -0.38147735595703125, -0.3655891418457031, -0.349700927734375, -0.3338127136230469, -0.31792449951171875, -0.3020362854003906, -0.2861480712890625, -0.2702598571777344, -0.25437164306640625, -0.23848342895507812, -0.22259521484375, -0.20670700073242188, -0.19081878662109375, -0.17493057250976562, -0.1590423583984375, -0.14315414428710938, -0.12726593017578125, -0.11137771606445312, -0.095489501953125, -0.07960128784179688, -0.06371307373046875, -0.047824859619140625, -0.0319366455078125, -0.016048431396484375, -0.00016021728515625, 0.015727996826171875, 0.0316162109375, 0.047504425048828125, 0.06339263916015625, 0.07928085327148438, 0.0951690673828125, 0.11105728149414062, 0.12694549560546875, 0.14283370971679688, 0.158721923828125, 0.17461013793945312, 0.19049835205078125, 0.20638656616210938, 0.2222747802734375, 0.23816299438476562, 0.25405120849609375, 0.2699394226074219, 0.28582763671875, 0.3017158508300781, 0.31760406494140625, 0.3334922790527344, 0.3493804931640625, 0.3652687072753906, 0.38115692138671875, 0.3970451354980469, 0.412933349609375, 0.4288215637207031, 0.44470977783203125, 0.4605979919433594, 0.4764862060546875, 0.4923744201660156, 0.5082626342773438, 0.5241508483886719, 0.5400390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 9.0, 3.0, 13.0, 8.0, 15.0, 18.0, 29.0, 32.0, 29.0, 29.0, 38.0, 42.0, 39.0, 47.0, 41.0, 47.0, 55.0, 52.0, 42.0, 55.0, 34.0, 37.0, 42.0, 36.0, 32.0, 20.0, 29.0, 18.0, 19.0, 14.0, 14.0, 8.0, 3.0, 6.0, 3.0, 0.0, 4.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1480712890625, -0.14307403564453125, -0.1380767822265625, -0.13307952880859375, -0.128082275390625, -0.12308502197265625, -0.1180877685546875, -0.11309051513671875, -0.10809326171875, -0.10309600830078125, -0.0980987548828125, -0.09310150146484375, -0.088104248046875, -0.08310699462890625, -0.0781097412109375, -0.07311248779296875, -0.068115234375, -0.06311798095703125, -0.0581207275390625, -0.05312347412109375, -0.048126220703125, -0.04312896728515625, -0.0381317138671875, -0.03313446044921875, -0.02813720703125, -0.02313995361328125, -0.0181427001953125, -0.01314544677734375, -0.008148193359375, -0.00315093994140625, 0.0018463134765625, 0.00684356689453125, 0.0118408203125, 0.01683807373046875, 0.0218353271484375, 0.02683258056640625, 0.031829833984375, 0.03682708740234375, 0.0418243408203125, 0.04682159423828125, 0.05181884765625, 0.05681610107421875, 0.0618133544921875, 0.06681060791015625, 0.071807861328125, 0.07680511474609375, 0.0818023681640625, 0.08679962158203125, 0.091796875, 0.09679412841796875, 0.1017913818359375, 0.10678863525390625, 0.111785888671875, 0.11678314208984375, 0.1217803955078125, 0.12677764892578125, 0.13177490234375, 0.13677215576171875, 0.1417694091796875, 0.14676666259765625, 0.151763916015625, 0.15676116943359375, 0.1617584228515625, 0.16675567626953125, 0.1717529296875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 13.0, 14.0, 18.0, 28.0, 25.0, 38.0, 32.0, 51.0, 56.0, 52.0, 65.0, 58.0, 58.0, 62.0, 56.0, 43.0, 50.0, 47.0, 44.0, 31.0, 26.0, 18.0, 22.0, 12.0, 12.0, 15.0, 9.0, 3.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.173572063446045, -6.939920902252197, -6.70626974105835, -6.47261905670166, -6.2389678955078125, -6.005316734313965, -5.771665573120117, -5.5380144119262695, -5.30436372756958, -5.070712566375732, -4.837061405181885, -4.603410720825195, -4.369759559631348, -4.1361083984375, -3.9024572372436523, -3.668806314468384, -3.435155153274536, -3.2015039920806885, -2.96785306930542, -2.7342019081115723, -2.5005509853363037, -2.266899824142456, -2.0332489013671875, -1.7995977401733398, -1.5659466981887817, -1.3322956562042236, -1.0986446142196655, -0.8649935126304626, -0.6313424706459045, -0.39769136905670166, -0.16404032707214355, 0.06961071491241455, 0.30326175689697266, 0.5369127988815308, 0.7705638408660889, 1.0042150020599365, 1.237865924835205, 1.4715170860290527, 1.7051681280136108, 1.938819169998169, 2.1724700927734375, 2.406121253967285, 2.6397721767425537, 2.8734233379364014, 3.10707426071167, 3.3407254219055176, 3.5743765830993652, 3.808027505874634, 4.041678428649902, 4.27532958984375, 4.508980751037598, 4.742631435394287, 4.976282596588135, 5.209933757781982, 5.44358491897583, 5.6772356033325195, 5.910887241363525, 6.144538402557373, 6.378189563751221, 6.61184024810791, 6.845491409301758, 7.0791425704956055, 7.312793731689453, 7.546444892883301, 7.78009557723999]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 15.0, 6.0, 4.0, 10.0, 19.0, 16.0, 17.0, 25.0, 27.0, 31.0, 29.0, 37.0, 33.0, 34.0, 17.0, 34.0, 36.0, 30.0, 40.0, 41.0, 46.0, 41.0, 37.0, 33.0, 35.0, 38.0, 38.0, 28.0, 23.0, 25.0, 20.0, 25.0, 17.0, 16.0, 13.0, 14.0, 8.0, 9.0, 7.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.959117412567139, -4.784794330596924, -4.610471248626709, -4.436148166656494, -4.261824607849121, -4.087501525878906, -3.9131784439086914, -3.7388553619384766, -3.5645322799682617, -3.390209197998047, -3.215886116027832, -3.041562795639038, -2.8672397136688232, -2.6929166316986084, -2.5185933113098145, -2.3442702293395996, -2.1699471473693848, -1.99562406539917, -1.8213008642196655, -1.6469776630401611, -1.4726545810699463, -1.2983314990997314, -1.124008297920227, -0.9496850967407227, -0.7753620147705078, -0.6010388731956482, -0.4267157316207886, -0.25239259004592896, -0.07806944847106934, 0.09625369310379028, 0.2705768346786499, 0.4449000358581543, 0.6192235946655273, 0.793546736240387, 0.9678698778152466, 1.142193078994751, 1.3165161609649658, 1.4908392429351807, 1.665162444114685, 1.8394856452941895, 2.0138087272644043, 2.188131809234619, 2.362454891204834, 2.536778211593628, 2.7111012935638428, 2.8854243755340576, 3.0597476959228516, 3.2340707778930664, 3.4083938598632812, 3.582716941833496, 3.757040023803711, 3.931363344192505, 4.105686187744141, 4.280009746551514, 4.4543328285217285, 4.628655910491943, 4.802978992462158, 4.977302074432373, 5.151625156402588, 5.325948238372803, 5.500271797180176, 5.674594879150391, 5.8489179611206055, 6.02324104309082, 6.197564125061035]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 11.0, 21.0, 27.0, 66.0, 78.0, 122.0, 194.0, 284.0, 530.0, 857.0, 1321.0, 2107.0, 3515.0, 5668.0, 9368.0, 15366.0, 25307.0, 41293.0, 64681.0, 95819.0, 128007.0, 147852.0, 144803.0, 120243.0, 87359.0, 58465.0, 37036.0, 22738.0, 13820.0, 8237.0, 5183.0, 3134.0, 1922.0, 1201.0, 724.0, 430.0, 286.0, 178.0, 114.0, 69.0, 51.0, 17.0, 16.0, 10.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0], "bins": [-5.72265625, -5.55859375, -5.39453125, -5.23046875, -5.06640625, -4.90234375, -4.73828125, -4.57421875, -4.41015625, -4.24609375, -4.08203125, -3.91796875, -3.75390625, -3.58984375, -3.42578125, -3.26171875, -3.09765625, -2.93359375, -2.76953125, -2.60546875, -2.44140625, -2.27734375, -2.11328125, -1.94921875, -1.78515625, -1.62109375, -1.45703125, -1.29296875, -1.12890625, -0.96484375, -0.80078125, -0.63671875, -0.47265625, -0.30859375, -0.14453125, 0.01953125, 0.18359375, 0.34765625, 0.51171875, 0.67578125, 0.83984375, 1.00390625, 1.16796875, 1.33203125, 1.49609375, 1.66015625, 1.82421875, 1.98828125, 2.15234375, 2.31640625, 2.48046875, 2.64453125, 2.80859375, 2.97265625, 3.13671875, 3.30078125, 3.46484375, 3.62890625, 3.79296875, 3.95703125, 4.12109375, 4.28515625, 4.44921875, 4.61328125, 4.77734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 6.0, 9.0, 8.0, 8.0, 11.0, 7.0, 9.0, 15.0, 19.0, 20.0, 39.0, 21.0, 34.0, 30.0, 46.0, 44.0, 51.0, 30.0, 38.0, 36.0, 48.0, 33.0, 37.0, 33.0, 40.0, 45.0, 36.0, 35.0, 27.0, 27.0, 34.0, 24.0, 22.0, 15.0, 15.0, 16.0, 5.0, 5.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.140625, -4.95416259765625, -4.7677001953125, -4.58123779296875, -4.394775390625, -4.20831298828125, -4.0218505859375, -3.83538818359375, -3.64892578125, -3.46246337890625, -3.2760009765625, -3.08953857421875, -2.903076171875, -2.71661376953125, -2.5301513671875, -2.34368896484375, -2.1572265625, -1.97076416015625, -1.7843017578125, -1.59783935546875, -1.411376953125, -1.22491455078125, -1.0384521484375, -0.85198974609375, -0.66552734375, -0.47906494140625, -0.2926025390625, -0.10614013671875, 0.080322265625, 0.26678466796875, 0.4532470703125, 0.63970947265625, 0.826171875, 1.01263427734375, 1.1990966796875, 1.38555908203125, 1.572021484375, 1.75848388671875, 1.9449462890625, 2.13140869140625, 2.31787109375, 2.50433349609375, 2.6907958984375, 2.87725830078125, 3.063720703125, 3.25018310546875, 3.4366455078125, 3.62310791015625, 3.8095703125, 3.99603271484375, 4.1824951171875, 4.36895751953125, 4.555419921875, 4.74188232421875, 4.9283447265625, 5.11480712890625, 5.30126953125, 5.48773193359375, 5.6741943359375, 5.86065673828125, 6.047119140625, 6.23358154296875, 6.4200439453125, 6.60650634765625, 6.79296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 12.0, 8.0, 16.0, 29.0, 23.0, 53.0, 61.0, 108.0, 177.0, 294.0, 388.0, 647.0, 932.0, 1495.0, 2232.0, 3485.0, 5577.0, 8732.0, 14215.0, 21952.0, 35597.0, 54024.0, 79018.0, 107030.0, 129478.0, 138105.0, 126959.0, 103206.0, 74848.0, 50117.0, 33185.0, 20884.0, 13061.0, 8325.0, 5159.0, 3127.0, 2050.0, 1286.0, 954.0, 600.0, 371.0, 241.0, 181.0, 123.0, 73.0, 44.0, 33.0, 15.0, 10.0, 11.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.4609375, -5.29754638671875, -5.1341552734375, -4.97076416015625, -4.807373046875, -4.64398193359375, -4.4805908203125, -4.31719970703125, -4.15380859375, -3.99041748046875, -3.8270263671875, -3.66363525390625, -3.500244140625, -3.33685302734375, -3.1734619140625, -3.01007080078125, -2.8466796875, -2.68328857421875, -2.5198974609375, -2.35650634765625, -2.193115234375, -2.02972412109375, -1.8663330078125, -1.70294189453125, -1.53955078125, -1.37615966796875, -1.2127685546875, -1.04937744140625, -0.885986328125, -0.72259521484375, -0.5592041015625, -0.39581298828125, -0.232421875, -0.06903076171875, 0.0943603515625, 0.25775146484375, 0.421142578125, 0.58453369140625, 0.7479248046875, 0.91131591796875, 1.07470703125, 1.23809814453125, 1.4014892578125, 1.56488037109375, 1.728271484375, 1.89166259765625, 2.0550537109375, 2.21844482421875, 2.3818359375, 2.54522705078125, 2.7086181640625, 2.87200927734375, 3.035400390625, 3.19879150390625, 3.3621826171875, 3.52557373046875, 3.68896484375, 3.85235595703125, 4.0157470703125, 4.17913818359375, 4.342529296875, 4.50592041015625, 4.6693115234375, 4.83270263671875, 4.99609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 9.0, 6.0, 5.0, 10.0, 8.0, 7.0, 15.0, 9.0, 12.0, 19.0, 25.0, 24.0, 32.0, 33.0, 36.0, 23.0, 37.0, 44.0, 34.0, 44.0, 48.0, 47.0, 50.0, 36.0, 32.0, 39.0, 29.0, 23.0, 38.0, 28.0, 26.0, 27.0, 14.0, 28.0, 22.0, 18.0, 10.0, 10.0, 11.0, 11.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.505859375, -3.395751953125, -3.28564453125, -3.175537109375, -3.0654296875, -2.955322265625, -2.84521484375, -2.735107421875, -2.625, -2.514892578125, -2.40478515625, -2.294677734375, -2.1845703125, -2.074462890625, -1.96435546875, -1.854248046875, -1.744140625, -1.634033203125, -1.52392578125, -1.413818359375, -1.3037109375, -1.193603515625, -1.08349609375, -0.973388671875, -0.86328125, -0.753173828125, -0.64306640625, -0.532958984375, -0.4228515625, -0.312744140625, -0.20263671875, -0.092529296875, 0.017578125, 0.127685546875, 0.23779296875, 0.347900390625, 0.4580078125, 0.568115234375, 0.67822265625, 0.788330078125, 0.8984375, 1.008544921875, 1.11865234375, 1.228759765625, 1.3388671875, 1.448974609375, 1.55908203125, 1.669189453125, 1.779296875, 1.889404296875, 1.99951171875, 2.109619140625, 2.2197265625, 2.329833984375, 2.43994140625, 2.550048828125, 2.66015625, 2.770263671875, 2.88037109375, 2.990478515625, 3.1005859375, 3.210693359375, 3.32080078125, 3.430908203125, 3.541015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 10.0, 9.0, 17.0, 24.0, 39.0, 54.0, 78.0, 117.0, 169.0, 286.0, 453.0, 728.0, 1231.0, 2236.0, 3939.0, 7853.0, 15495.0, 31183.0, 61004.0, 111281.0, 173334.0, 206101.0, 179219.0, 118640.0, 65790.0, 33527.0, 16953.0, 8494.0, 4441.0, 2388.0, 1367.0, 753.0, 476.0, 292.0, 201.0, 112.0, 86.0, 51.0, 51.0, 23.0, 18.0, 9.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.71014404296875, -2.6214599609375, -2.53277587890625, -2.444091796875, -2.35540771484375, -2.2667236328125, -2.17803955078125, -2.08935546875, -2.00067138671875, -1.9119873046875, -1.82330322265625, -1.734619140625, -1.64593505859375, -1.5572509765625, -1.46856689453125, -1.3798828125, -1.29119873046875, -1.2025146484375, -1.11383056640625, -1.025146484375, -0.93646240234375, -0.8477783203125, -0.75909423828125, -0.67041015625, -0.58172607421875, -0.4930419921875, -0.40435791015625, -0.315673828125, -0.22698974609375, -0.1383056640625, -0.04962158203125, 0.0390625, 0.12774658203125, 0.2164306640625, 0.30511474609375, 0.393798828125, 0.48248291015625, 0.5711669921875, 0.65985107421875, 0.74853515625, 0.83721923828125, 0.9259033203125, 1.01458740234375, 1.103271484375, 1.19195556640625, 1.2806396484375, 1.36932373046875, 1.4580078125, 1.54669189453125, 1.6353759765625, 1.72406005859375, 1.812744140625, 1.90142822265625, 1.9901123046875, 2.07879638671875, 2.16748046875, 2.25616455078125, 2.3448486328125, 2.43353271484375, 2.522216796875, 2.61090087890625, 2.6995849609375, 2.78826904296875, 2.876953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 14.0, 19.0, 29.0, 20.0, 30.0, 49.0, 50.0, 62.0, 71.0, 81.0, 109.0, 69.0, 67.0, 66.0, 69.0, 50.0, 32.0, 20.0, 20.0, 13.0, 12.0, 11.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00042819976806640625, -0.00041736289858818054, -0.00040652602910995483, -0.0003956891596317291, -0.0003848522901535034, -0.0003740154206752777, -0.000363178551197052, -0.0003523416817188263, -0.0003415048122406006, -0.0003306679427623749, -0.00031983107328414917, -0.00030899420380592346, -0.00029815733432769775, -0.00028732046484947205, -0.00027648359537124634, -0.00026564672589302063, -0.0002548098564147949, -0.00024397298693656921, -0.0002331361174583435, -0.0002222992479801178, -0.0002114623785018921, -0.00020062550902366638, -0.00018978863954544067, -0.00017895177006721497, -0.00016811490058898926, -0.00015727803111076355, -0.00014644116163253784, -0.00013560429215431213, -0.00012476742267608643, -0.00011393055319786072, -0.00010309368371963501, -9.22568142414093e-05, -8.14199447631836e-05, -7.058307528495789e-05, -5.974620580673218e-05, -4.890933632850647e-05, -3.807246685028076e-05, -2.7235597372055054e-05, -1.6398727893829346e-05, -5.561858415603638e-06, 5.27501106262207e-06, 1.611188054084778e-05, 2.6948750019073486e-05, 3.7785619497299194e-05, 4.86224889755249e-05, 5.945935845375061e-05, 7.029622793197632e-05, 8.113309741020203e-05, 9.196996688842773e-05, 0.00010280683636665344, 0.00011364370584487915, 0.00012448057532310486, 0.00013531744480133057, 0.00014615431427955627, 0.00015699118375778198, 0.0001678280532360077, 0.0001786649227142334, 0.0001895017921924591, 0.00020033866167068481, 0.00021117553114891052, 0.00022201240062713623, 0.00023284927010536194, 0.00024368613958358765, 0.00025452300906181335, 0.00026535987854003906]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 6.0, 11.0, 30.0, 35.0, 43.0, 72.0, 125.0, 175.0, 252.0, 379.0, 561.0, 916.0, 1327.0, 2120.0, 3439.0, 5299.0, 8728.0, 14052.0, 22777.0, 36584.0, 56140.0, 82609.0, 111613.0, 132890.0, 138902.0, 126516.0, 100549.0, 72557.0, 48592.0, 30892.0, 18846.0, 11621.0, 7164.0, 4565.0, 2922.0, 1787.0, 1136.0, 808.0, 518.0, 328.0, 228.0, 140.0, 93.0, 75.0, 38.0, 25.0, 18.0, 19.0, 14.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.8486328125, -1.7914276123046875, -1.734222412109375, -1.6770172119140625, -1.61981201171875, -1.5626068115234375, -1.505401611328125, -1.4481964111328125, -1.3909912109375, -1.3337860107421875, -1.276580810546875, -1.2193756103515625, -1.16217041015625, -1.1049652099609375, -1.047760009765625, -0.9905548095703125, -0.933349609375, -0.8761444091796875, -0.818939208984375, -0.7617340087890625, -0.70452880859375, -0.6473236083984375, -0.590118408203125, -0.5329132080078125, -0.4757080078125, -0.4185028076171875, -0.361297607421875, -0.3040924072265625, -0.24688720703125, -0.1896820068359375, -0.132476806640625, -0.0752716064453125, -0.01806640625, 0.0391387939453125, 0.096343994140625, 0.1535491943359375, 0.21075439453125, 0.2679595947265625, 0.325164794921875, 0.3823699951171875, 0.4395751953125, 0.4967803955078125, 0.553985595703125, 0.6111907958984375, 0.66839599609375, 0.7256011962890625, 0.782806396484375, 0.8400115966796875, 0.897216796875, 0.9544219970703125, 1.011627197265625, 1.0688323974609375, 1.12603759765625, 1.1832427978515625, 1.240447998046875, 1.2976531982421875, 1.3548583984375, 1.4120635986328125, 1.469268798828125, 1.5264739990234375, 1.58367919921875, 1.6408843994140625, 1.698089599609375, 1.7552947998046875, 1.8125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 6.0, 7.0, 12.0, 11.0, 23.0, 13.0, 26.0, 21.0, 30.0, 40.0, 35.0, 53.0, 55.0, 57.0, 51.0, 63.0, 50.0, 46.0, 62.0, 51.0, 42.0, 41.0, 41.0, 32.0, 22.0, 18.0, 15.0, 18.0, 14.0, 12.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.951171875, -0.9220352172851562, -0.8928985595703125, -0.8637619018554688, -0.834625244140625, -0.8054885864257812, -0.7763519287109375, -0.7472152709960938, -0.71807861328125, -0.6889419555664062, -0.6598052978515625, -0.6306686401367188, -0.601531982421875, -0.5723953247070312, -0.5432586669921875, -0.5141220092773438, -0.4849853515625, -0.45584869384765625, -0.4267120361328125, -0.39757537841796875, -0.368438720703125, -0.33930206298828125, -0.3101654052734375, -0.28102874755859375, -0.25189208984375, -0.22275543212890625, -0.1936187744140625, -0.16448211669921875, -0.135345458984375, -0.10620880126953125, -0.0770721435546875, -0.04793548583984375, -0.018798828125, 0.01033782958984375, 0.0394744873046875, 0.06861114501953125, 0.097747802734375, 0.12688446044921875, 0.1560211181640625, 0.18515777587890625, 0.21429443359375, 0.24343109130859375, 0.2725677490234375, 0.30170440673828125, 0.330841064453125, 0.35997772216796875, 0.3891143798828125, 0.41825103759765625, 0.4473876953125, 0.47652435302734375, 0.5056610107421875, 0.5347976684570312, 0.563934326171875, 0.5930709838867188, 0.6222076416015625, 0.6513442993164062, 0.68048095703125, 0.7096176147460938, 0.7387542724609375, 0.7678909301757812, 0.797027587890625, 0.8261642456054688, 0.8553009033203125, 0.8844375610351562, 0.91357421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 7.0, 8.0, 10.0, 14.0, 14.0, 17.0, 22.0, 31.0, 30.0, 38.0, 32.0, 39.0, 41.0, 52.0, 47.0, 62.0, 49.0, 52.0, 60.0, 44.0, 58.0, 40.0, 33.0, 28.0, 29.0, 27.0, 17.0, 23.0, 13.0, 16.0, 13.0, 8.0, 4.0, 5.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.312180042266846, -6.101543426513672, -5.890907287597656, -5.680270671844482, -5.469634532928467, -5.258997917175293, -5.048361778259277, -4.8377251625061035, -4.627089023590088, -4.416452407836914, -4.205816268920898, -3.9951798915863037, -3.784543514251709, -3.573906898498535, -3.3632707595825195, -3.1526341438293457, -2.941997766494751, -2.7313613891601562, -2.5207250118255615, -2.310088634490967, -2.099452257156372, -1.8888157606124878, -1.678179383277893, -1.4675430059432983, -1.2569066286087036, -1.0462702512741089, -0.8356338739395142, -0.6249974370002747, -0.41436105966567993, -0.20372462272644043, 0.006911754608154297, 0.21754813194274902, 0.42818450927734375, 0.6388208866119385, 0.8494572639465332, 1.060093641281128, 1.2707300186157227, 1.481366515159607, 1.6920028924942017, 1.9026392698287964, 2.1132755279541016, 2.3239119052886963, 2.534548282623291, 2.7451846599578857, 2.9558210372924805, 3.1664576530456543, 3.37709379196167, 3.5877304077148438, 3.7983667850494385, 4.009003162384033, 4.219639778137207, 4.430275917053223, 4.6409125328063965, 4.851548671722412, 5.062185287475586, 5.272821426391602, 5.483458042144775, 5.694094657897949, 5.904730796813965, 6.115367412567139, 6.326003551483154, 6.536640167236328, 6.747276306152344, 6.957912921905518, 7.168549060821533]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 13.0, 13.0, 15.0, 21.0, 26.0, 25.0, 21.0, 19.0, 23.0, 30.0, 35.0, 35.0, 31.0, 41.0, 29.0, 37.0, 43.0, 46.0, 35.0, 42.0, 45.0, 38.0, 35.0, 33.0, 33.0, 26.0, 29.0, 30.0, 21.0, 18.0, 18.0, 22.0, 15.0, 9.0, 10.0, 13.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.399958610534668, -5.217442035675049, -5.0349249839782715, -4.852408409118652, -4.669891834259033, -4.487375259399414, -4.304858207702637, -4.122341632843018, -3.9398248195648193, -3.757308006286621, -3.574791431427002, -3.3922746181488037, -3.2097578048706055, -3.0272412300109863, -2.844724416732788, -2.66220760345459, -2.4796910285949707, -2.2971742153167725, -2.1146576404571533, -1.932140827178955, -1.7496241331100464, -1.5671074390411377, -1.3845906257629395, -1.2020739316940308, -1.019557237625122, -0.8370405435562134, -0.6545237898826599, -0.47200703620910645, -0.28949034214019775, -0.10697364807128906, 0.07554316520690918, 0.25805985927581787, 0.44057655334472656, 0.6230932474136353, 0.8056100010871887, 0.9881267547607422, 1.1706434488296509, 1.3531601428985596, 1.5356769561767578, 1.7181936502456665, 1.9007103443145752, 2.0832271575927734, 2.2657437324523926, 2.448260545730591, 2.630777359008789, 2.813293933868408, 2.9958107471466064, 3.1783275604248047, 3.360844135284424, 3.543360948562622, 3.725877523422241, 3.9083943367004395, 4.090910911560059, 4.273427963256836, 4.455944538116455, 4.638461112976074, 4.820978164672852, 5.003494739532471, 5.186011791229248, 5.368528366088867, 5.551044940948486, 5.7335615158081055, 5.916078567504883, 6.098595142364502, 6.281111717224121]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 15.0, 16.0, 30.0, 48.0, 54.0, 85.0, 138.0, 206.0, 310.0, 438.0, 766.0, 1158.0, 1836.0, 2976.0, 5212.0, 8973.0, 16030.0, 28656.0, 53468.0, 100678.0, 190208.0, 351530.0, 578396.0, 767768.0, 764245.0, 573562.0, 345202.0, 186223.0, 97259.0, 51954.0, 28454.0, 15662.0, 8854.0, 5181.0, 3208.0, 1950.0, 1207.0, 733.0, 551.0, 314.0, 228.0, 168.0, 89.0, 69.0, 43.0, 37.0, 25.0, 19.0, 15.0, 15.0, 2.0, 5.0, 6.0, 0.0, 1.0, 3.0], "bins": [-5.2734375, -5.10858154296875, -4.9437255859375, -4.77886962890625, -4.614013671875, -4.44915771484375, -4.2843017578125, -4.11944580078125, -3.95458984375, -3.78973388671875, -3.6248779296875, -3.46002197265625, -3.295166015625, -3.13031005859375, -2.9654541015625, -2.80059814453125, -2.6357421875, -2.47088623046875, -2.3060302734375, -2.14117431640625, -1.976318359375, -1.81146240234375, -1.6466064453125, -1.48175048828125, -1.31689453125, -1.15203857421875, -0.9871826171875, -0.82232666015625, -0.657470703125, -0.49261474609375, -0.3277587890625, -0.16290283203125, 0.001953125, 0.16680908203125, 0.3316650390625, 0.49652099609375, 0.661376953125, 0.82623291015625, 0.9910888671875, 1.15594482421875, 1.32080078125, 1.48565673828125, 1.6505126953125, 1.81536865234375, 1.980224609375, 2.14508056640625, 2.3099365234375, 2.47479248046875, 2.6396484375, 2.80450439453125, 2.9693603515625, 3.13421630859375, 3.299072265625, 3.46392822265625, 3.6287841796875, 3.79364013671875, 3.95849609375, 4.12335205078125, 4.2882080078125, 4.45306396484375, 4.617919921875, 4.78277587890625, 4.9476318359375, 5.11248779296875, 5.27734375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 9.0, 6.0, 10.0, 14.0, 22.0, 24.0, 19.0, 18.0, 32.0, 29.0, 30.0, 35.0, 27.0, 33.0, 37.0, 34.0, 35.0, 40.0, 40.0, 56.0, 57.0, 37.0, 34.0, 36.0, 28.0, 31.0, 32.0, 22.0, 25.0, 17.0, 30.0, 13.0, 25.0, 12.0, 7.0, 10.0, 11.0, 8.0, 12.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.48724365234375, -4.3260498046875, -4.16485595703125, -4.003662109375, -3.84246826171875, -3.6812744140625, -3.52008056640625, -3.35888671875, -3.19769287109375, -3.0364990234375, -2.87530517578125, -2.714111328125, -2.55291748046875, -2.3917236328125, -2.23052978515625, -2.0693359375, -1.90814208984375, -1.7469482421875, -1.58575439453125, -1.424560546875, -1.26336669921875, -1.1021728515625, -0.94097900390625, -0.77978515625, -0.61859130859375, -0.4573974609375, -0.29620361328125, -0.135009765625, 0.02618408203125, 0.1873779296875, 0.34857177734375, 0.509765625, 0.67095947265625, 0.8321533203125, 0.99334716796875, 1.154541015625, 1.31573486328125, 1.4769287109375, 1.63812255859375, 1.79931640625, 1.96051025390625, 2.1217041015625, 2.28289794921875, 2.444091796875, 2.60528564453125, 2.7664794921875, 2.92767333984375, 3.0888671875, 3.25006103515625, 3.4112548828125, 3.57244873046875, 3.733642578125, 3.89483642578125, 4.0560302734375, 4.21722412109375, 4.37841796875, 4.53961181640625, 4.7008056640625, 4.86199951171875, 5.023193359375, 5.18438720703125, 5.3455810546875, 5.50677490234375, 5.66796875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 11.0, 16.0, 27.0, 34.0, 63.0, 113.0, 192.0, 278.0, 437.0, 705.0, 1169.0, 2028.0, 3434.0, 6013.0, 10209.0, 18367.0, 33454.0, 60593.0, 109856.0, 197489.0, 337968.0, 535485.0, 716031.0, 735319.0, 569228.0, 366833.0, 216248.0, 121704.0, 66718.0, 36540.0, 20476.0, 11393.0, 6435.0, 3821.0, 2209.0, 1335.0, 775.0, 494.0, 276.0, 182.0, 107.0, 81.0, 44.0, 30.0, 17.0, 15.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-6.26953125, -6.08001708984375, -5.8905029296875, -5.70098876953125, -5.511474609375, -5.32196044921875, -5.1324462890625, -4.94293212890625, -4.75341796875, -4.56390380859375, -4.3743896484375, -4.18487548828125, -3.995361328125, -3.80584716796875, -3.6163330078125, -3.42681884765625, -3.2373046875, -3.04779052734375, -2.8582763671875, -2.66876220703125, -2.479248046875, -2.28973388671875, -2.1002197265625, -1.91070556640625, -1.72119140625, -1.53167724609375, -1.3421630859375, -1.15264892578125, -0.963134765625, -0.77362060546875, -0.5841064453125, -0.39459228515625, -0.205078125, -0.01556396484375, 0.1739501953125, 0.36346435546875, 0.552978515625, 0.74249267578125, 0.9320068359375, 1.12152099609375, 1.31103515625, 1.50054931640625, 1.6900634765625, 1.87957763671875, 2.069091796875, 2.25860595703125, 2.4481201171875, 2.63763427734375, 2.8271484375, 3.01666259765625, 3.2061767578125, 3.39569091796875, 3.585205078125, 3.77471923828125, 3.9642333984375, 4.15374755859375, 4.34326171875, 4.53277587890625, 4.7222900390625, 4.91180419921875, 5.101318359375, 5.29083251953125, 5.4803466796875, 5.66986083984375, 5.859375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 5.0, 13.0, 13.0, 15.0, 20.0, 28.0, 38.0, 43.0, 53.0, 69.0, 78.0, 99.0, 109.0, 133.0, 137.0, 145.0, 150.0, 197.0, 206.0, 222.0, 246.0, 227.0, 223.0, 228.0, 179.0, 178.0, 144.0, 140.0, 148.0, 118.0, 70.0, 64.0, 71.0, 55.0, 52.0, 29.0, 21.0, 26.0, 18.0, 10.0, 11.0, 10.0, 6.0, 6.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.962890625, -1.894744873046875, -1.82659912109375, -1.758453369140625, -1.6903076171875, -1.622161865234375, -1.55401611328125, -1.485870361328125, -1.417724609375, -1.349578857421875, -1.28143310546875, -1.213287353515625, -1.1451416015625, -1.076995849609375, -1.00885009765625, -0.940704345703125, -0.87255859375, -0.804412841796875, -0.73626708984375, -0.668121337890625, -0.5999755859375, -0.531829833984375, -0.46368408203125, -0.395538330078125, -0.327392578125, -0.259246826171875, -0.19110107421875, -0.122955322265625, -0.0548095703125, 0.013336181640625, 0.08148193359375, 0.149627685546875, 0.2177734375, 0.285919189453125, 0.35406494140625, 0.422210693359375, 0.4903564453125, 0.558502197265625, 0.62664794921875, 0.694793701171875, 0.762939453125, 0.831085205078125, 0.89923095703125, 0.967376708984375, 1.0355224609375, 1.103668212890625, 1.17181396484375, 1.239959716796875, 1.30810546875, 1.376251220703125, 1.44439697265625, 1.512542724609375, 1.5806884765625, 1.648834228515625, 1.71697998046875, 1.785125732421875, 1.853271484375, 1.921417236328125, 1.98956298828125, 2.057708740234375, 2.1258544921875, 2.194000244140625, 2.26214599609375, 2.330291748046875, 2.3984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 8.0, 14.0, 12.0, 18.0, 11.0, 20.0, 22.0, 30.0, 41.0, 45.0, 41.0, 33.0, 46.0, 47.0, 80.0, 64.0, 47.0, 56.0, 57.0, 40.0, 35.0, 44.0, 28.0, 26.0, 23.0, 23.0, 13.0, 24.0, 8.0, 6.0, 2.0, 5.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-7.452527046203613, -7.24315071105957, -7.033774375915527, -6.824398040771484, -6.6150221824646, -6.405645847320557, -6.196269512176514, -5.986893177032471, -5.777517318725586, -5.568140983581543, -5.3587646484375, -5.149388313293457, -4.940012454986572, -4.730636119842529, -4.521259784698486, -4.311883449554443, -4.1025071144104, -3.8931307792663574, -3.6837546825408936, -3.4743783473968506, -3.2650022506713867, -3.0556259155273438, -2.846249580383301, -2.636873245239258, -2.427497148513794, -2.218120813369751, -2.008744716644287, -1.7993683815002441, -1.5899921655654907, -1.3806159496307373, -1.1712396144866943, -0.9618633985519409, -0.7524867057800293, -0.5431104898452759, -0.3337342143058777, -0.12435793876647949, 0.08501827716827393, 0.29439449310302734, 0.5037708282470703, 0.7131470441818237, 0.9225232601165771, 1.1318994760513306, 1.341275691986084, 1.550652027130127, 1.7600282430648804, 1.9694044589996338, 2.1787807941436768, 2.3881568908691406, 2.5975332260131836, 2.8069095611572266, 3.0162856578826904, 3.2256619930267334, 3.4350380897521973, 3.6444144248962402, 3.853790760040283, 4.063167095184326, 4.272542953491211, 4.481919288635254, 4.691295623779297, 4.90067195892334, 5.110047817230225, 5.319424152374268, 5.5288004875183105, 5.7381768226623535, 5.9475531578063965]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 12.0, 13.0, 13.0, 22.0, 19.0, 23.0, 25.0, 26.0, 23.0, 32.0, 35.0, 35.0, 42.0, 40.0, 46.0, 36.0, 41.0, 47.0, 45.0, 37.0, 46.0, 43.0, 46.0, 33.0, 33.0, 31.0, 34.0, 17.0, 22.0, 16.0, 15.0, 8.0, 7.0, 8.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.150420665740967, -4.953828811645508, -4.757237434387207, -4.560645580291748, -4.364053726196289, -4.16746187210083, -3.97087025642395, -3.7742786407470703, -3.5776867866516113, -3.3810949325561523, -3.1845033168792725, -2.9879117012023926, -2.7913198471069336, -2.5947279930114746, -2.3981363773345947, -2.201544761657715, -2.004952907562256, -1.8083611726760864, -1.611769437789917, -1.4151777029037476, -1.2185859680175781, -1.0219942331314087, -0.8254024982452393, -0.6288107633590698, -0.4322190284729004, -0.23562729358673096, -0.03903555870056152, 0.1575561761856079, 0.35414791107177734, 0.5507396459579468, 0.7473313808441162, 0.9439231157302856, 1.1405143737792969, 1.3371061086654663, 1.5336978435516357, 1.7302895784378052, 1.9268813133239746, 2.1234731674194336, 2.3200647830963135, 2.5166563987731934, 2.7132482528686523, 2.9098401069641113, 3.106431722640991, 3.303023338317871, 3.49961519241333, 3.696207046508789, 3.892798662185669, 4.089390277862549, 4.285982131958008, 4.482573986053467, 4.679165840148926, 4.875757217407227, 5.0723490715026855, 5.2689409255981445, 5.465532302856445, 5.662124156951904, 5.858716011047363, 6.055307865142822, 6.251899719238281, 6.448491096496582, 6.645082950592041, 6.8416748046875, 7.038266181945801, 7.23485803604126, 7.431449890136719]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 8.0, 5.0, 15.0, 21.0, 30.0, 42.0, 53.0, 96.0, 138.0, 245.0, 374.0, 518.0, 808.0, 1300.0, 1782.0, 2688.0, 4168.0, 6401.0, 9854.0, 14951.0, 23067.0, 36119.0, 53989.0, 80105.0, 110238.0, 135729.0, 143535.0, 126548.0, 96780.0, 68136.0, 45438.0, 30026.0, 19323.0, 12373.0, 8191.0, 5302.0, 3427.0, 2224.0, 1568.0, 1006.0, 641.0, 432.0, 290.0, 202.0, 126.0, 77.0, 51.0, 39.0, 22.0, 13.0, 14.0, 10.0, 10.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.28515625, -1.24127197265625, -1.1973876953125, -1.15350341796875, -1.109619140625, -1.06573486328125, -1.0218505859375, -0.97796630859375, -0.93408203125, -0.89019775390625, -0.8463134765625, -0.80242919921875, -0.758544921875, -0.71466064453125, -0.6707763671875, -0.62689208984375, -0.5830078125, -0.53912353515625, -0.4952392578125, -0.45135498046875, -0.407470703125, -0.36358642578125, -0.3197021484375, -0.27581787109375, -0.23193359375, -0.18804931640625, -0.1441650390625, -0.10028076171875, -0.056396484375, -0.01251220703125, 0.0313720703125, 0.07525634765625, 0.119140625, 0.16302490234375, 0.2069091796875, 0.25079345703125, 0.294677734375, 0.33856201171875, 0.3824462890625, 0.42633056640625, 0.47021484375, 0.51409912109375, 0.5579833984375, 0.60186767578125, 0.645751953125, 0.68963623046875, 0.7335205078125, 0.77740478515625, 0.8212890625, 0.86517333984375, 0.9090576171875, 0.95294189453125, 0.996826171875, 1.04071044921875, 1.0845947265625, 1.12847900390625, 1.17236328125, 1.21624755859375, 1.2601318359375, 1.30401611328125, 1.347900390625, 1.39178466796875, 1.4356689453125, 1.47955322265625, 1.5234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 12.0, 17.0, 17.0, 21.0, 13.0, 22.0, 28.0, 29.0, 30.0, 34.0, 35.0, 31.0, 42.0, 32.0, 39.0, 41.0, 49.0, 31.0, 47.0, 33.0, 35.0, 36.0, 31.0, 30.0, 35.0, 43.0, 31.0, 25.0, 24.0, 13.0, 5.0, 16.0, 7.0, 9.0, 6.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.1507568359375, -4.965576171875, -4.7803955078125, -4.59521484375, -4.4100341796875, -4.224853515625, -4.0396728515625, -3.8544921875, -3.6693115234375, -3.484130859375, -3.2989501953125, -3.11376953125, -2.9285888671875, -2.743408203125, -2.5582275390625, -2.373046875, -2.1878662109375, -2.002685546875, -1.8175048828125, -1.63232421875, -1.4471435546875, -1.261962890625, -1.0767822265625, -0.8916015625, -0.7064208984375, -0.521240234375, -0.3360595703125, -0.15087890625, 0.0343017578125, 0.219482421875, 0.4046630859375, 0.58984375, 0.7750244140625, 0.960205078125, 1.1453857421875, 1.33056640625, 1.5157470703125, 1.700927734375, 1.8861083984375, 2.0712890625, 2.2564697265625, 2.441650390625, 2.6268310546875, 2.81201171875, 2.9971923828125, 3.182373046875, 3.3675537109375, 3.552734375, 3.7379150390625, 3.923095703125, 4.1082763671875, 4.29345703125, 4.4786376953125, 4.663818359375, 4.8489990234375, 5.0341796875, 5.2193603515625, 5.404541015625, 5.5897216796875, 5.77490234375, 5.9600830078125, 6.145263671875, 6.3304443359375, 6.515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 8.0, 7.0, 16.0, 26.0, 31.0, 43.0, 61.0, 78.0, 133.0, 241.0, 374.0, 636.0, 1100.0, 1883.0, 3379.0, 6412.0, 12222.0, 25107.0, 101004.0, 805627.0, 49196.0, 19424.0, 9712.0, 5122.0, 2826.0, 1514.0, 890.0, 510.0, 329.0, 210.0, 137.0, 64.0, 60.0, 36.0, 36.0, 21.0, 19.0, 9.0, 6.0, 13.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.1080322265625, -5.919189453125, -5.7303466796875, -5.54150390625, -5.3526611328125, -5.163818359375, -4.9749755859375, -4.7861328125, -4.5972900390625, -4.408447265625, -4.2196044921875, -4.03076171875, -3.8419189453125, -3.653076171875, -3.4642333984375, -3.275390625, -3.0865478515625, -2.897705078125, -2.7088623046875, -2.52001953125, -2.3311767578125, -2.142333984375, -1.9534912109375, -1.7646484375, -1.5758056640625, -1.386962890625, -1.1981201171875, -1.00927734375, -0.8204345703125, -0.631591796875, -0.4427490234375, -0.25390625, -0.0650634765625, 0.123779296875, 0.3126220703125, 0.50146484375, 0.6903076171875, 0.879150390625, 1.0679931640625, 1.2568359375, 1.4456787109375, 1.634521484375, 1.8233642578125, 2.01220703125, 2.2010498046875, 2.389892578125, 2.5787353515625, 2.767578125, 2.9564208984375, 3.145263671875, 3.3341064453125, 3.52294921875, 3.7117919921875, 3.900634765625, 4.0894775390625, 4.2783203125, 4.4671630859375, 4.656005859375, 4.8448486328125, 5.03369140625, 5.2225341796875, 5.411376953125, 5.6002197265625, 5.7890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 9.0, 14.0, 10.0, 8.0, 21.0, 11.0, 22.0, 19.0, 17.0, 31.0, 24.0, 40.0, 33.0, 46.0, 46.0, 39.0, 52.0, 58.0, 54.0, 49.0, 41.0, 32.0, 39.0, 30.0, 33.0, 36.0, 35.0, 22.0, 17.0, 21.0, 18.0, 18.0, 9.0, 7.0, 4.0, 5.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.75, -4.60888671875, -4.4677734375, -4.32666015625, -4.185546875, -4.04443359375, -3.9033203125, -3.76220703125, -3.62109375, -3.47998046875, -3.3388671875, -3.19775390625, -3.056640625, -2.91552734375, -2.7744140625, -2.63330078125, -2.4921875, -2.35107421875, -2.2099609375, -2.06884765625, -1.927734375, -1.78662109375, -1.6455078125, -1.50439453125, -1.36328125, -1.22216796875, -1.0810546875, -0.93994140625, -0.798828125, -0.65771484375, -0.5166015625, -0.37548828125, -0.234375, -0.09326171875, 0.0478515625, 0.18896484375, 0.330078125, 0.47119140625, 0.6123046875, 0.75341796875, 0.89453125, 1.03564453125, 1.1767578125, 1.31787109375, 1.458984375, 1.60009765625, 1.7412109375, 1.88232421875, 2.0234375, 2.16455078125, 2.3056640625, 2.44677734375, 2.587890625, 2.72900390625, 2.8701171875, 3.01123046875, 3.15234375, 3.29345703125, 3.4345703125, 3.57568359375, 3.716796875, 3.85791015625, 3.9990234375, 4.14013671875, 4.28125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 10.0, 6.0, 15.0, 15.0, 15.0, 24.0, 30.0, 47.0, 78.0, 93.0, 141.0, 185.0, 293.0, 466.0, 734.0, 1213.0, 2055.0, 3783.0, 6687.0, 12456.0, 24724.0, 96356.0, 789656.0, 61904.0, 21630.0, 11295.0, 6034.0, 3396.0, 1904.0, 1185.0, 680.0, 449.0, 323.0, 177.0, 134.0, 86.0, 62.0, 37.0, 54.0, 35.0, 26.0, 22.0, 13.0, 8.0, 12.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.41748046875, -0.4041900634765625, -0.390899658203125, -0.3776092529296875, -0.36431884765625, -0.3510284423828125, -0.337738037109375, -0.3244476318359375, -0.3111572265625, -0.2978668212890625, -0.284576416015625, -0.2712860107421875, -0.25799560546875, -0.2447052001953125, -0.231414794921875, -0.2181243896484375, -0.204833984375, -0.1915435791015625, -0.178253173828125, -0.1649627685546875, -0.15167236328125, -0.1383819580078125, -0.125091552734375, -0.1118011474609375, -0.0985107421875, -0.0852203369140625, -0.071929931640625, -0.0586395263671875, -0.04534912109375, -0.0320587158203125, -0.018768310546875, -0.0054779052734375, 0.0078125, 0.0211029052734375, 0.034393310546875, 0.0476837158203125, 0.06097412109375, 0.0742645263671875, 0.087554931640625, 0.1008453369140625, 0.1141357421875, 0.1274261474609375, 0.140716552734375, 0.1540069580078125, 0.16729736328125, 0.1805877685546875, 0.193878173828125, 0.2071685791015625, 0.220458984375, 0.2337493896484375, 0.247039794921875, 0.2603302001953125, 0.27362060546875, 0.2869110107421875, 0.300201416015625, 0.3134918212890625, 0.3267822265625, 0.3400726318359375, 0.353363037109375, 0.3666534423828125, 0.37994384765625, 0.3932342529296875, 0.406524658203125, 0.4198150634765625, 0.43310546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 3.0, 10.0, 6.0, 12.0, 9.0, 9.0, 16.0, 13.0, 14.0, 31.0, 32.0, 24.0, 26.0, 33.0, 32.0, 26.0, 46.0, 43.0, 37.0, 47.0, 38.0, 61.0, 52.0, 53.0, 37.0, 32.0, 40.0, 30.0, 26.0, 33.0, 22.0, 17.0, 9.0, 14.0, 14.0, 9.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.4616718292236328e-05, -2.379622310400009e-05, -2.2975727915763855e-05, -2.215523272752762e-05, -2.1334737539291382e-05, -2.0514242351055145e-05, -1.969374716281891e-05, -1.8873251974582672e-05, -1.8052756786346436e-05, -1.72322615981102e-05, -1.6411766409873962e-05, -1.5591271221637726e-05, -1.477077603340149e-05, -1.3950280845165253e-05, -1.3129785656929016e-05, -1.230929046869278e-05, -1.1488795280456543e-05, -1.0668300092220306e-05, -9.84780490398407e-06, -9.027309715747833e-06, -8.206814527511597e-06, -7.38631933927536e-06, -6.5658241510391235e-06, -5.745328962802887e-06, -4.92483377456665e-06, -4.104338586330414e-06, -3.2838433980941772e-06, -2.4633482098579407e-06, -1.642853021621704e-06, -8.223578333854675e-07, -1.862645149230957e-09, 8.186325430870056e-07, 1.6391277313232422e-06, 2.4596229195594788e-06, 3.2801181077957153e-06, 4.100613296031952e-06, 4.9211084842681885e-06, 5.741603672504425e-06, 6.562098860740662e-06, 7.382594048976898e-06, 8.203089237213135e-06, 9.023584425449371e-06, 9.844079613685608e-06, 1.0664574801921844e-05, 1.1485069990158081e-05, 1.2305565178394318e-05, 1.3126060366630554e-05, 1.394655555486679e-05, 1.4767050743103027e-05, 1.5587545931339264e-05, 1.64080411195755e-05, 1.7228536307811737e-05, 1.8049031496047974e-05, 1.886952668428421e-05, 1.9690021872520447e-05, 2.0510517060756683e-05, 2.133101224899292e-05, 2.2151507437229156e-05, 2.2972002625465393e-05, 2.379249781370163e-05, 2.4612993001937866e-05, 2.5433488190174103e-05, 2.625398337841034e-05, 2.7074478566646576e-05, 2.7894973754882812e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 12.0, 23.0, 24.0, 41.0, 53.0, 97.0, 129.0, 170.0, 264.0, 355.0, 559.0, 786.0, 1153.0, 1719.0, 2515.0, 3897.0, 5775.0, 8917.0, 13976.0, 21616.0, 34141.0, 54578.0, 86094.0, 126477.0, 158701.0, 158793.0, 127060.0, 87218.0, 55462.0, 34635.0, 22062.0, 14076.0, 9106.0, 6000.0, 3837.0, 2748.0, 1726.0, 1192.0, 809.0, 521.0, 377.0, 273.0, 179.0, 122.0, 97.0, 64.0, 53.0, 21.0, 17.0, 10.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0], "bins": [-0.30908203125, -0.29972076416015625, -0.2903594970703125, -0.28099822998046875, -0.271636962890625, -0.26227569580078125, -0.2529144287109375, -0.24355316162109375, -0.23419189453125, -0.22483062744140625, -0.2154693603515625, -0.20610809326171875, -0.196746826171875, -0.18738555908203125, -0.1780242919921875, -0.16866302490234375, -0.1593017578125, -0.14994049072265625, -0.1405792236328125, -0.13121795654296875, -0.121856689453125, -0.11249542236328125, -0.1031341552734375, -0.09377288818359375, -0.08441162109375, -0.07505035400390625, -0.0656890869140625, -0.05632781982421875, -0.046966552734375, -0.03760528564453125, -0.0282440185546875, -0.01888275146484375, -0.009521484375, -0.00016021728515625, 0.0092010498046875, 0.01856231689453125, 0.027923583984375, 0.03728485107421875, 0.0466461181640625, 0.05600738525390625, 0.06536865234375, 0.07472991943359375, 0.0840911865234375, 0.09345245361328125, 0.102813720703125, 0.11217498779296875, 0.1215362548828125, 0.13089752197265625, 0.1402587890625, 0.14962005615234375, 0.1589813232421875, 0.16834259033203125, 0.177703857421875, 0.18706512451171875, 0.1964263916015625, 0.20578765869140625, 0.21514892578125, 0.22451019287109375, 0.2338714599609375, 0.24323272705078125, 0.252593994140625, 0.26195526123046875, 0.2713165283203125, 0.28067779541015625, 0.2900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 11.0, 7.0, 3.0, 7.0, 8.0, 10.0, 22.0, 23.0, 26.0, 23.0, 36.0, 39.0, 53.0, 53.0, 58.0, 73.0, 67.0, 77.0, 51.0, 63.0, 47.0, 38.0, 43.0, 37.0, 18.0, 18.0, 20.0, 14.0, 15.0, 12.0, 3.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16357421875, -0.15824317932128906, -0.15291213989257812, -0.1475811004638672, -0.14225006103515625, -0.1369190216064453, -0.13158798217773438, -0.12625694274902344, -0.1209259033203125, -0.11559486389160156, -0.11026382446289062, -0.10493278503417969, -0.09960174560546875, -0.09427070617675781, -0.08893966674804688, -0.08360862731933594, -0.078277587890625, -0.07294654846191406, -0.06761550903320312, -0.06228446960449219, -0.05695343017578125, -0.05162239074707031, -0.046291351318359375, -0.04096031188964844, -0.0356292724609375, -0.030298233032226562, -0.024967193603515625, -0.019636154174804688, -0.01430511474609375, -0.008974075317382812, -0.003643035888671875, 0.0016880035400390625, 0.00701904296875, 0.012350082397460938, 0.017681121826171875, 0.023012161254882812, 0.02834320068359375, 0.03367424011230469, 0.039005279541015625, 0.04433631896972656, 0.0496673583984375, 0.05499839782714844, 0.060329437255859375, 0.06566047668457031, 0.07099151611328125, 0.07632255554199219, 0.08165359497070312, 0.08698463439941406, 0.092315673828125, 0.09764671325683594, 0.10297775268554688, 0.10830879211425781, 0.11363983154296875, 0.11897087097167969, 0.12430191040039062, 0.12963294982910156, 0.1349639892578125, 0.14029502868652344, 0.14562606811523438, 0.1509571075439453, 0.15628814697265625, 0.1616191864013672, 0.16695022583007812, 0.17228126525878906, 0.1776123046875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 11.0, 11.0, 14.0, 18.0, 20.0, 21.0, 30.0, 29.0, 51.0, 42.0, 42.0, 33.0, 73.0, 60.0, 68.0, 57.0, 50.0, 55.0, 38.0, 42.0, 36.0, 31.0, 33.0, 21.0, 19.0, 25.0, 11.0, 10.0, 7.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-7.77983283996582, -7.567878723144531, -7.355924606323242, -7.143970489501953, -6.932016372680664, -6.720062255859375, -6.508108139038086, -6.296154022216797, -6.084199905395508, -5.872245788574219, -5.66029167175293, -5.448337554931641, -5.236383438110352, -5.0244293212890625, -4.812475204467773, -4.600521087646484, -4.388566493988037, -4.176612377166748, -3.964658260345459, -3.75270414352417, -3.540750026702881, -3.328795909881592, -3.1168415546417236, -2.9048874378204346, -2.6929333209991455, -2.4809792041778564, -2.2690250873565674, -2.057070732116699, -1.8451167345046997, -1.6331626176834106, -1.421208381652832, -1.209254264831543, -0.9973001480102539, -0.7853460311889648, -0.573391854763031, -0.36143767833709717, -0.1494835615158081, 0.06247055530548096, 0.27442479133605957, 0.48637890815734863, 0.6983330249786377, 0.9102871417999268, 1.1222412586212158, 1.3341954946517944, 1.5461496114730835, 1.7581037282943726, 1.9700579643249512, 2.1820120811462402, 2.3939661979675293, 2.6059203147888184, 2.8178744316101074, 3.0298285484313965, 3.2417826652526855, 3.4537367820739746, 3.6656911373138428, 3.877645254135132, 4.089599609375, 4.301553726196289, 4.513507843017578, 4.725461959838867, 4.937416076660156, 5.149370193481445, 5.361324310302734, 5.573278427124023, 5.7852325439453125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 15.0, 10.0, 18.0, 17.0, 23.0, 23.0, 25.0, 26.0, 25.0, 27.0, 40.0, 36.0, 42.0, 36.0, 44.0, 41.0, 43.0, 52.0, 45.0, 34.0, 42.0, 52.0, 40.0, 35.0, 29.0, 31.0, 33.0, 17.0, 19.0, 15.0, 13.0, 12.0, 4.0, 10.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.081655025482178, -4.885140895843506, -4.688626766204834, -4.492112636566162, -4.29559850692749, -4.099084377288818, -3.9025702476501465, -3.7060561180114746, -3.5095419883728027, -3.313027858734131, -3.116513729095459, -2.919999599456787, -2.7234854698181152, -2.5269713401794434, -2.3304572105407715, -2.1339430809020996, -1.9374287128448486, -1.7409145832061768, -1.5444004535675049, -1.347886323928833, -1.1513721942901611, -0.9548580050468445, -0.7583438158035278, -0.561829686164856, -0.3653155565261841, -0.168801411986351, 0.027712732553482056, 0.22422689199447632, 0.4207410216331482, 0.6172551512718201, 0.8137693405151367, 1.0102834701538086, 1.2067975997924805, 1.4033117294311523, 1.5998258590698242, 1.796339988708496, 1.992854118347168, 2.18936824798584, 2.3858823776245117, 2.5823965072631836, 2.7789106369018555, 2.9754247665405273, 3.171938896179199, 3.368453025817871, 3.564967155456543, 3.761481285095215, 3.9579954147338867, 4.154509544372559, 4.3510236740112305, 4.547537803649902, 4.744051933288574, 4.940566062927246, 5.137080192565918, 5.33359432220459, 5.530108451843262, 5.726622581481934, 5.923137187957764, 6.1196513175964355, 6.316165447235107, 6.512679576873779, 6.709193706512451, 6.905707836151123, 7.102221965789795, 7.298736095428467, 7.495250225067139]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 13.0, 11.0, 25.0, 39.0, 49.0, 73.0, 116.0, 160.0, 272.0, 392.0, 579.0, 881.0, 1351.0, 2095.0, 3317.0, 5453.0, 8180.0, 13612.0, 21504.0, 34337.0, 53216.0, 79555.0, 109135.0, 134344.0, 142906.0, 129502.0, 102246.0, 73495.0, 48192.0, 31038.0, 19454.0, 11988.0, 7609.0, 4803.0, 3010.0, 1919.0, 1237.0, 860.0, 531.0, 355.0, 247.0, 132.0, 121.0, 69.0, 37.0, 35.0, 25.0, 7.0, 7.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.60546875, -4.458740234375, -4.31201171875, -4.165283203125, -4.0185546875, -3.871826171875, -3.72509765625, -3.578369140625, -3.431640625, -3.284912109375, -3.13818359375, -2.991455078125, -2.8447265625, -2.697998046875, -2.55126953125, -2.404541015625, -2.2578125, -2.111083984375, -1.96435546875, -1.817626953125, -1.6708984375, -1.524169921875, -1.37744140625, -1.230712890625, -1.083984375, -0.937255859375, -0.79052734375, -0.643798828125, -0.4970703125, -0.350341796875, -0.20361328125, -0.056884765625, 0.08984375, 0.236572265625, 0.38330078125, 0.530029296875, 0.6767578125, 0.823486328125, 0.97021484375, 1.116943359375, 1.263671875, 1.410400390625, 1.55712890625, 1.703857421875, 1.8505859375, 1.997314453125, 2.14404296875, 2.290771484375, 2.4375, 2.584228515625, 2.73095703125, 2.877685546875, 3.0244140625, 3.171142578125, 3.31787109375, 3.464599609375, 3.611328125, 3.758056640625, 3.90478515625, 4.051513671875, 4.1982421875, 4.344970703125, 4.49169921875, 4.638427734375, 4.78515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 12.0, 18.0, 18.0, 24.0, 27.0, 25.0, 26.0, 21.0, 28.0, 36.0, 36.0, 49.0, 37.0, 43.0, 48.0, 39.0, 44.0, 45.0, 41.0, 43.0, 38.0, 30.0, 38.0, 40.0, 27.0, 18.0, 29.0, 15.0, 11.0, 12.0, 12.0, 12.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.2196044921875, -5.029052734375, -4.8385009765625, -4.64794921875, -4.4573974609375, -4.266845703125, -4.0762939453125, -3.8857421875, -3.6951904296875, -3.504638671875, -3.3140869140625, -3.12353515625, -2.9329833984375, -2.742431640625, -2.5518798828125, -2.361328125, -2.1707763671875, -1.980224609375, -1.7896728515625, -1.59912109375, -1.4085693359375, -1.218017578125, -1.0274658203125, -0.8369140625, -0.6463623046875, -0.455810546875, -0.2652587890625, -0.07470703125, 0.1158447265625, 0.306396484375, 0.4969482421875, 0.6875, 0.8780517578125, 1.068603515625, 1.2591552734375, 1.44970703125, 1.6402587890625, 1.830810546875, 2.0213623046875, 2.2119140625, 2.4024658203125, 2.593017578125, 2.7835693359375, 2.97412109375, 3.1646728515625, 3.355224609375, 3.5457763671875, 3.736328125, 3.9268798828125, 4.117431640625, 4.3079833984375, 4.49853515625, 4.6890869140625, 4.879638671875, 5.0701904296875, 5.2607421875, 5.4512939453125, 5.641845703125, 5.8323974609375, 6.02294921875, 6.2135009765625, 6.404052734375, 6.5946044921875, 6.78515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 9.0, 10.0, 16.0, 23.0, 29.0, 54.0, 71.0, 125.0, 216.0, 278.0, 397.0, 636.0, 939.0, 1393.0, 2033.0, 3057.0, 4606.0, 6771.0, 10277.0, 15702.0, 23448.0, 34111.0, 49064.0, 68157.0, 88741.0, 108243.0, 118877.0, 117961.0, 104537.0, 84648.0, 63569.0, 45283.0, 31293.0, 21233.0, 14071.0, 9567.0, 6219.0, 4255.0, 2885.0, 1846.0, 1332.0, 843.0, 595.0, 357.0, 243.0, 203.0, 123.0, 72.0, 52.0, 43.0, 18.0, 12.0, 7.0, 4.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.9296875, -3.7982177734375, -3.666748046875, -3.5352783203125, -3.40380859375, -3.2723388671875, -3.140869140625, -3.0093994140625, -2.8779296875, -2.7464599609375, -2.614990234375, -2.4835205078125, -2.35205078125, -2.2205810546875, -2.089111328125, -1.9576416015625, -1.826171875, -1.6947021484375, -1.563232421875, -1.4317626953125, -1.30029296875, -1.1688232421875, -1.037353515625, -0.9058837890625, -0.7744140625, -0.6429443359375, -0.511474609375, -0.3800048828125, -0.24853515625, -0.1170654296875, 0.014404296875, 0.1458740234375, 0.27734375, 0.4088134765625, 0.540283203125, 0.6717529296875, 0.80322265625, 0.9346923828125, 1.066162109375, 1.1976318359375, 1.3291015625, 1.4605712890625, 1.592041015625, 1.7235107421875, 1.85498046875, 1.9864501953125, 2.117919921875, 2.2493896484375, 2.380859375, 2.5123291015625, 2.643798828125, 2.7752685546875, 2.90673828125, 3.0382080078125, 3.169677734375, 3.3011474609375, 3.4326171875, 3.5640869140625, 3.695556640625, 3.8270263671875, 3.95849609375, 4.0899658203125, 4.221435546875, 4.3529052734375, 4.484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 3.0, 5.0, 4.0, 13.0, 11.0, 14.0, 14.0, 18.0, 22.0, 21.0, 29.0, 26.0, 33.0, 29.0, 40.0, 46.0, 45.0, 34.0, 40.0, 38.0, 43.0, 37.0, 36.0, 37.0, 47.0, 35.0, 27.0, 35.0, 36.0, 35.0, 23.0, 20.0, 20.0, 19.0, 15.0, 9.0, 7.0, 8.0, 11.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96875, -3.852203369140625, -3.73565673828125, -3.619110107421875, -3.5025634765625, -3.386016845703125, -3.26947021484375, -3.152923583984375, -3.036376953125, -2.919830322265625, -2.80328369140625, -2.686737060546875, -2.5701904296875, -2.453643798828125, -2.33709716796875, -2.220550537109375, -2.10400390625, -1.987457275390625, -1.87091064453125, -1.754364013671875, -1.6378173828125, -1.521270751953125, -1.40472412109375, -1.288177490234375, -1.171630859375, -1.055084228515625, -0.93853759765625, -0.821990966796875, -0.7054443359375, -0.588897705078125, -0.47235107421875, -0.355804443359375, -0.2392578125, -0.122711181640625, -0.00616455078125, 0.110382080078125, 0.2269287109375, 0.343475341796875, 0.46002197265625, 0.576568603515625, 0.693115234375, 0.809661865234375, 0.92620849609375, 1.042755126953125, 1.1593017578125, 1.275848388671875, 1.39239501953125, 1.508941650390625, 1.62548828125, 1.742034912109375, 1.85858154296875, 1.975128173828125, 2.0916748046875, 2.208221435546875, 2.32476806640625, 2.441314697265625, 2.557861328125, 2.674407958984375, 2.79095458984375, 2.907501220703125, 3.0240478515625, 3.140594482421875, 3.25714111328125, 3.373687744140625, 3.490234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 14.0, 19.0, 22.0, 37.0, 53.0, 96.0, 135.0, 225.0, 332.0, 551.0, 924.0, 1546.0, 2523.0, 4647.0, 8459.0, 15996.0, 29696.0, 53980.0, 91814.0, 137956.0, 173458.0, 173022.0, 138636.0, 93366.0, 54934.0, 30228.0, 15990.0, 8612.0, 4637.0, 2611.0, 1568.0, 946.0, 562.0, 330.0, 239.0, 139.0, 89.0, 54.0, 37.0, 21.0, 18.0, 8.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9384765625, -1.8738861083984375, -1.809295654296875, -1.7447052001953125, -1.68011474609375, -1.6155242919921875, -1.550933837890625, -1.4863433837890625, -1.4217529296875, -1.3571624755859375, -1.292572021484375, -1.2279815673828125, -1.16339111328125, -1.0988006591796875, -1.034210205078125, -0.9696197509765625, -0.905029296875, -0.8404388427734375, -0.775848388671875, -0.7112579345703125, -0.64666748046875, -0.5820770263671875, -0.517486572265625, -0.4528961181640625, -0.3883056640625, -0.3237152099609375, -0.259124755859375, -0.1945343017578125, -0.12994384765625, -0.0653533935546875, -0.000762939453125, 0.0638275146484375, 0.12841796875, 0.1930084228515625, 0.257598876953125, 0.3221893310546875, 0.38677978515625, 0.4513702392578125, 0.515960693359375, 0.5805511474609375, 0.6451416015625, 0.7097320556640625, 0.774322509765625, 0.8389129638671875, 0.90350341796875, 0.9680938720703125, 1.032684326171875, 1.0972747802734375, 1.161865234375, 1.2264556884765625, 1.291046142578125, 1.3556365966796875, 1.42022705078125, 1.4848175048828125, 1.549407958984375, 1.6139984130859375, 1.6785888671875, 1.7431793212890625, 1.807769775390625, 1.8723602294921875, 1.93695068359375, 2.0015411376953125, 2.066131591796875, 2.1307220458984375, 2.1953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 4.0, 11.0, 7.0, 9.0, 15.0, 22.0, 25.0, 22.0, 26.0, 56.0, 39.0, 42.0, 46.0, 61.0, 46.0, 55.0, 46.0, 56.0, 53.0, 50.0, 50.0, 36.0, 32.0, 28.0, 25.0, 28.0, 13.0, 14.0, 13.0, 16.0, 8.0, 4.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00019919872283935547, -0.00019319169223308563, -0.0001871846616268158, -0.00018117763102054596, -0.00017517060041427612, -0.0001691635698080063, -0.00016315653920173645, -0.00015714950859546661, -0.00015114247798919678, -0.00014513544738292694, -0.0001391284167766571, -0.00013312138617038727, -0.00012711435556411743, -0.0001211073249578476, -0.00011510029435157776, -0.00010909326374530792, -0.00010308623313903809, -9.707920253276825e-05, -9.107217192649841e-05, -8.506514132022858e-05, -7.905811071395874e-05, -7.30510801076889e-05, -6.704404950141907e-05, -6.103701889514923e-05, -5.5029988288879395e-05, -4.902295768260956e-05, -4.301592707633972e-05, -3.7008896470069885e-05, -3.100186586380005e-05, -2.4994835257530212e-05, -1.8987804651260376e-05, -1.298077404499054e-05, -6.973743438720703e-06, -9.667128324508667e-07, 5.04031777381897e-06, 1.1047348380088806e-05, 1.7054378986358643e-05, 2.306140959262848e-05, 2.9068440198898315e-05, 3.507547080516815e-05, 4.108250141143799e-05, 4.7089532017707825e-05, 5.309656262397766e-05, 5.91035932302475e-05, 6.511062383651733e-05, 7.111765444278717e-05, 7.712468504905701e-05, 8.313171565532684e-05, 8.913874626159668e-05, 9.514577686786652e-05, 0.00010115280747413635, 0.00010715983808040619, 0.00011316686868667603, 0.00011917389929294586, 0.0001251809298992157, 0.00013118796050548553, 0.00013719499111175537, 0.0001432020217180252, 0.00014920905232429504, 0.00015521608293056488, 0.00016122311353683472, 0.00016723014414310455, 0.0001732371747493744, 0.00017924420535564423, 0.00018525123596191406]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 12.0, 20.0, 31.0, 32.0, 36.0, 57.0, 76.0, 138.0, 190.0, 267.0, 395.0, 646.0, 1028.0, 1739.0, 2893.0, 4766.0, 8088.0, 13949.0, 22980.0, 37773.0, 59322.0, 86340.0, 115367.0, 136752.0, 141524.0, 125774.0, 99663.0, 70259.0, 46452.0, 28732.0, 17450.0, 10338.0, 6089.0, 3584.0, 2166.0, 1281.0, 807.0, 498.0, 342.0, 206.0, 158.0, 106.0, 72.0, 42.0, 41.0, 20.0, 16.0, 10.0, 7.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5720062255859375, -1.519989013671875, -1.4679718017578125, -1.41595458984375, -1.3639373779296875, -1.311920166015625, -1.2599029541015625, -1.2078857421875, -1.1558685302734375, -1.103851318359375, -1.0518341064453125, -0.99981689453125, -0.9477996826171875, -0.895782470703125, -0.8437652587890625, -0.791748046875, -0.7397308349609375, -0.687713623046875, -0.6356964111328125, -0.58367919921875, -0.5316619873046875, -0.479644775390625, -0.4276275634765625, -0.3756103515625, -0.3235931396484375, -0.271575927734375, -0.2195587158203125, -0.16754150390625, -0.1155242919921875, -0.063507080078125, -0.0114898681640625, 0.04052734375, 0.0925445556640625, 0.144561767578125, 0.1965789794921875, 0.24859619140625, 0.3006134033203125, 0.352630615234375, 0.4046478271484375, 0.4566650390625, 0.5086822509765625, 0.560699462890625, 0.6127166748046875, 0.66473388671875, 0.7167510986328125, 0.768768310546875, 0.8207855224609375, 0.872802734375, 0.9248199462890625, 0.976837158203125, 1.0288543701171875, 1.08087158203125, 1.1328887939453125, 1.184906005859375, 1.2369232177734375, 1.2889404296875, 1.3409576416015625, 1.392974853515625, 1.4449920654296875, 1.49700927734375, 1.5490264892578125, 1.601043701171875, 1.6530609130859375, 1.705078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 18.0, 24.0, 23.0, 24.0, 38.0, 33.0, 46.0, 48.0, 71.0, 62.0, 62.0, 71.0, 56.0, 76.0, 43.0, 51.0, 47.0, 29.0, 30.0, 25.0, 13.0, 21.0, 13.0, 8.0, 11.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.029296875, -1.0023651123046875, -0.975433349609375, -0.9485015869140625, -0.92156982421875, -0.8946380615234375, -0.867706298828125, -0.8407745361328125, -0.8138427734375, -0.7869110107421875, -0.759979248046875, -0.7330474853515625, -0.70611572265625, -0.6791839599609375, -0.652252197265625, -0.6253204345703125, -0.598388671875, -0.5714569091796875, -0.544525146484375, -0.5175933837890625, -0.49066162109375, -0.4637298583984375, -0.436798095703125, -0.4098663330078125, -0.3829345703125, -0.3560028076171875, -0.329071044921875, -0.3021392822265625, -0.27520751953125, -0.2482757568359375, -0.221343994140625, -0.1944122314453125, -0.16748046875, -0.1405487060546875, -0.113616943359375, -0.0866851806640625, -0.05975341796875, -0.0328216552734375, -0.005889892578125, 0.0210418701171875, 0.0479736328125, 0.0749053955078125, 0.101837158203125, 0.1287689208984375, 0.15570068359375, 0.1826324462890625, 0.209564208984375, 0.2364959716796875, 0.263427734375, 0.2903594970703125, 0.317291259765625, 0.3442230224609375, 0.37115478515625, 0.3980865478515625, 0.425018310546875, 0.4519500732421875, 0.4788818359375, 0.5058135986328125, 0.532745361328125, 0.5596771240234375, 0.58660888671875, 0.6135406494140625, 0.640472412109375, 0.6674041748046875, 0.6943359375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 3.0, 5.0, 17.0, 17.0, 19.0, 23.0, 17.0, 29.0, 28.0, 36.0, 41.0, 49.0, 55.0, 63.0, 48.0, 59.0, 56.0, 43.0, 62.0, 38.0, 48.0, 41.0, 35.0, 24.0, 39.0, 19.0, 11.0, 18.0, 10.0, 8.0, 4.0, 5.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.248305320739746, -7.039919853210449, -6.831534385681152, -6.623148441314697, -6.4147629737854, -6.2063775062561035, -5.997991561889648, -5.789606094360352, -5.581220626831055, -5.372835159301758, -5.164449691772461, -4.956063747406006, -4.747678279876709, -4.539292812347412, -4.330906867980957, -4.12252140045166, -3.9141359329223633, -3.7057504653930664, -3.4973647594451904, -3.2889790534973145, -3.0805935859680176, -2.8722081184387207, -2.6638224124908447, -2.4554367065429688, -2.247051239013672, -2.038665771484375, -1.830280065536499, -1.6218944787979126, -1.4135088920593262, -1.2051233053207397, -0.9967377185821533, -0.7883521318435669, -0.5799670219421387, -0.37158143520355225, -0.16319584846496582, 0.045189738273620605, 0.25357532501220703, 0.46196091175079346, 0.6703464984893799, 0.8787320852279663, 1.0871176719665527, 1.2955032587051392, 1.5038888454437256, 1.712274432182312, 1.9206600189208984, 2.1290454864501953, 2.3374311923980713, 2.5458168983459473, 2.754202365875244, 2.962587833404541, 3.170973539352417, 3.379359245300293, 3.58774471282959, 3.7961301803588867, 4.004515647888184, 4.212901592254639, 4.4212870597839355, 4.629672527313232, 4.8380584716796875, 5.046443939208984, 5.254829406738281, 5.463214874267578, 5.671600341796875, 5.87998628616333, 6.088371753692627]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 5.0, 4.0, 9.0, 13.0, 13.0, 5.0, 9.0, 18.0, 14.0, 18.0, 28.0, 22.0, 32.0, 33.0, 26.0, 37.0, 28.0, 28.0, 38.0, 32.0, 40.0, 31.0, 39.0, 39.0, 36.0, 29.0, 38.0, 40.0, 34.0, 32.0, 26.0, 26.0, 24.0, 35.0, 13.0, 21.0, 17.0, 10.0, 11.0, 9.0, 5.0, 9.0, 7.0, 2.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.998111724853516, -4.82769775390625, -4.657283782958984, -4.486869812011719, -4.316455841064453, -4.1460418701171875, -3.975627899169922, -3.8052139282226562, -3.6347999572753906, -3.464385986328125, -3.2939720153808594, -3.1235580444335938, -2.953144073486328, -2.7827301025390625, -2.612316131591797, -2.4419021606445312, -2.2714881896972656, -2.10107421875, -1.9306602478027344, -1.7602462768554688, -1.5898323059082031, -1.4194183349609375, -1.2490043640136719, -1.0785903930664062, -0.9081764221191406, -0.737762451171875, -0.5673484802246094, -0.39693450927734375, -0.22652053833007812, -0.0561065673828125, 0.11430740356445312, 0.28472137451171875, 0.4551358222961426, 0.6255497932434082, 0.7959637641906738, 0.9663777351379395, 1.136791706085205, 1.3072056770324707, 1.4776196479797363, 1.648033618927002, 1.8184475898742676, 1.9888615608215332, 2.159275531768799, 2.3296895027160645, 2.50010347366333, 2.6705174446105957, 2.8409314155578613, 3.011345386505127, 3.1817593574523926, 3.352173328399658, 3.522587299346924, 3.6930012702941895, 3.863415241241455, 4.033829212188721, 4.204243183135986, 4.374657154083252, 4.545071125030518, 4.715485095977783, 4.885899066925049, 5.0563130378723145, 5.22672700881958, 5.397140979766846, 5.567554950714111, 5.737968921661377, 5.908382892608643]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 9.0, 10.0, 14.0, 16.0, 24.0, 43.0, 57.0, 95.0, 178.0, 237.0, 458.0, 806.0, 1452.0, 2683.0, 5448.0, 10693.0, 22692.0, 50093.0, 118541.0, 286793.0, 641662.0, 1042924.0, 997989.0, 573025.0, 249927.0, 103014.0, 44727.0, 20425.0, 9826.0, 4861.0, 2409.0, 1332.0, 721.0, 433.0, 254.0, 163.0, 96.0, 54.0, 37.0, 21.0, 12.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51953125, -7.28399658203125, -7.0484619140625, -6.81292724609375, -6.577392578125, -6.34185791015625, -6.1063232421875, -5.87078857421875, -5.63525390625, -5.39971923828125, -5.1641845703125, -4.92864990234375, -4.693115234375, -4.45758056640625, -4.2220458984375, -3.98651123046875, -3.7509765625, -3.51544189453125, -3.2799072265625, -3.04437255859375, -2.808837890625, -2.57330322265625, -2.3377685546875, -2.10223388671875, -1.86669921875, -1.63116455078125, -1.3956298828125, -1.16009521484375, -0.924560546875, -0.68902587890625, -0.4534912109375, -0.21795654296875, 0.017578125, 0.25311279296875, 0.4886474609375, 0.72418212890625, 0.959716796875, 1.19525146484375, 1.4307861328125, 1.66632080078125, 1.90185546875, 2.13739013671875, 2.3729248046875, 2.60845947265625, 2.843994140625, 3.07952880859375, 3.3150634765625, 3.55059814453125, 3.7861328125, 4.02166748046875, 4.2572021484375, 4.49273681640625, 4.728271484375, 4.96380615234375, 5.1993408203125, 5.43487548828125, 5.67041015625, 5.90594482421875, 6.1414794921875, 6.37701416015625, 6.612548828125, 6.84808349609375, 7.0836181640625, 7.31915283203125, 7.5546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 8.0, 7.0, 11.0, 5.0, 12.0, 16.0, 13.0, 23.0, 20.0, 27.0, 26.0, 29.0, 29.0, 25.0, 41.0, 27.0, 34.0, 25.0, 23.0, 33.0, 33.0, 29.0, 30.0, 33.0, 37.0, 41.0, 37.0, 23.0, 35.0, 32.0, 32.0, 20.0, 22.0, 16.0, 20.0, 14.0, 15.0, 15.0, 12.0, 9.0, 6.0, 7.0, 7.0, 8.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.15625, -4.01959228515625, -3.8829345703125, -3.74627685546875, -3.609619140625, -3.47296142578125, -3.3363037109375, -3.19964599609375, -3.06298828125, -2.92633056640625, -2.7896728515625, -2.65301513671875, -2.516357421875, -2.37969970703125, -2.2430419921875, -2.10638427734375, -1.9697265625, -1.83306884765625, -1.6964111328125, -1.55975341796875, -1.423095703125, -1.28643798828125, -1.1497802734375, -1.01312255859375, -0.87646484375, -0.73980712890625, -0.6031494140625, -0.46649169921875, -0.329833984375, -0.19317626953125, -0.0565185546875, 0.08013916015625, 0.216796875, 0.35345458984375, 0.4901123046875, 0.62677001953125, 0.763427734375, 0.90008544921875, 1.0367431640625, 1.17340087890625, 1.31005859375, 1.44671630859375, 1.5833740234375, 1.72003173828125, 1.856689453125, 1.99334716796875, 2.1300048828125, 2.26666259765625, 2.4033203125, 2.53997802734375, 2.6766357421875, 2.81329345703125, 2.949951171875, 3.08660888671875, 3.2232666015625, 3.35992431640625, 3.49658203125, 3.63323974609375, 3.7698974609375, 3.90655517578125, 4.043212890625, 4.17987060546875, 4.3165283203125, 4.45318603515625, 4.58984375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 4.0, 5.0, 6.0, 21.0, 33.0, 57.0, 55.0, 93.0, 133.0, 229.0, 346.0, 537.0, 894.0, 1591.0, 2769.0, 4630.0, 8298.0, 15121.0, 27183.0, 49863.0, 91186.0, 167797.0, 296782.0, 484155.0, 680864.0, 748438.0, 626998.0, 424473.0, 250947.0, 140585.0, 76510.0, 41482.0, 22883.0, 12537.0, 6984.0, 3961.0, 2332.0, 1365.0, 816.0, 475.0, 297.0, 167.0, 133.0, 73.0, 59.0, 39.0, 26.0, 14.0, 13.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0], "bins": [-6.1328125, -5.93719482421875, -5.7415771484375, -5.54595947265625, -5.350341796875, -5.15472412109375, -4.9591064453125, -4.76348876953125, -4.56787109375, -4.37225341796875, -4.1766357421875, -3.98101806640625, -3.785400390625, -3.58978271484375, -3.3941650390625, -3.19854736328125, -3.0029296875, -2.80731201171875, -2.6116943359375, -2.41607666015625, -2.220458984375, -2.02484130859375, -1.8292236328125, -1.63360595703125, -1.43798828125, -1.24237060546875, -1.0467529296875, -0.85113525390625, -0.655517578125, -0.45989990234375, -0.2642822265625, -0.06866455078125, 0.126953125, 0.32257080078125, 0.5181884765625, 0.71380615234375, 0.909423828125, 1.10504150390625, 1.3006591796875, 1.49627685546875, 1.69189453125, 1.88751220703125, 2.0831298828125, 2.27874755859375, 2.474365234375, 2.66998291015625, 2.8656005859375, 3.06121826171875, 3.2568359375, 3.45245361328125, 3.6480712890625, 3.84368896484375, 4.039306640625, 4.23492431640625, 4.4305419921875, 4.62615966796875, 4.82177734375, 5.01739501953125, 5.2130126953125, 5.40863037109375, 5.604248046875, 5.79986572265625, 5.9954833984375, 6.19110107421875, 6.38671875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 16.0, 16.0, 14.0, 21.0, 28.0, 43.0, 61.0, 74.0, 94.0, 109.0, 134.0, 156.0, 165.0, 210.0, 229.0, 239.0, 295.0, 273.0, 275.0, 257.0, 246.0, 215.0, 192.0, 156.0, 131.0, 94.0, 93.0, 68.0, 43.0, 38.0, 21.0, 14.0, 14.0, 13.0, 6.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.680389404296875, -2.59515380859375, -2.509918212890625, -2.4246826171875, -2.339447021484375, -2.25421142578125, -2.168975830078125, -2.083740234375, -1.998504638671875, -1.91326904296875, -1.828033447265625, -1.7427978515625, -1.657562255859375, -1.57232666015625, -1.487091064453125, -1.40185546875, -1.316619873046875, -1.23138427734375, -1.146148681640625, -1.0609130859375, -0.975677490234375, -0.89044189453125, -0.805206298828125, -0.719970703125, -0.634735107421875, -0.54949951171875, -0.464263916015625, -0.3790283203125, -0.293792724609375, -0.20855712890625, -0.123321533203125, -0.0380859375, 0.047149658203125, 0.13238525390625, 0.217620849609375, 0.3028564453125, 0.388092041015625, 0.47332763671875, 0.558563232421875, 0.643798828125, 0.729034423828125, 0.81427001953125, 0.899505615234375, 0.9847412109375, 1.069976806640625, 1.15521240234375, 1.240447998046875, 1.32568359375, 1.410919189453125, 1.49615478515625, 1.581390380859375, 1.6666259765625, 1.751861572265625, 1.83709716796875, 1.922332763671875, 2.007568359375, 2.092803955078125, 2.17803955078125, 2.263275146484375, 2.3485107421875, 2.433746337890625, 2.51898193359375, 2.604217529296875, 2.689453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3.0, 1.0, 12.0, 14.0, 18.0, 16.0, 22.0, 25.0, 29.0, 46.0, 44.0, 45.0, 43.0, 53.0, 59.0, 62.0, 55.0, 56.0, 63.0, 59.0, 45.0, 42.0, 49.0, 30.0, 24.0, 18.0, 12.0, 9.0, 7.0, 14.0, 10.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.243093967437744, -7.009957790374756, -6.776822090148926, -6.5436859130859375, -6.310549736022949, -6.077413558959961, -5.844277858734131, -5.611141681671143, -5.3780059814453125, -5.144869804382324, -4.911734104156494, -4.678597927093506, -4.445461750030518, -4.2123260498046875, -3.979189872741699, -3.746053695678711, -3.5129175186157227, -3.2797815799713135, -3.046645402908325, -2.813509464263916, -2.5803732872009277, -2.3472373485565186, -2.1141014099121094, -1.8809653520584106, -1.647829294204712, -1.4146932363510132, -1.1815571784973145, -0.9484212398529053, -0.7152851819992065, -0.4821491241455078, -0.24901318550109863, -0.015877127647399902, 0.21725845336914062, 0.45039448142051697, 0.6835305094718933, 0.9166665077209473, 1.149802565574646, 1.3829386234283447, 1.616074562072754, 1.8492106199264526, 2.0823466777801514, 2.3154826164245605, 2.548618793487549, 2.781754732131958, 3.014890670776367, 3.2480268478393555, 3.4811627864837646, 3.714298725128174, 3.947434902191162, 4.18057107925415, 4.4137067794799805, 4.646842956542969, 4.879979133605957, 5.113115310668945, 5.346251010894775, 5.579387187957764, 5.812522888183594, 6.045659065246582, 6.278794765472412, 6.5119309425354, 6.745067119598389, 6.978202819824219, 7.211338996887207, 7.444475173950195, 7.677611351013184]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 5.0, 6.0, 15.0, 16.0, 27.0, 16.0, 23.0, 26.0, 25.0, 22.0, 30.0, 34.0, 25.0, 41.0, 25.0, 46.0, 36.0, 45.0, 39.0, 41.0, 33.0, 36.0, 46.0, 30.0, 42.0, 32.0, 26.0, 17.0, 19.0, 21.0, 22.0, 17.0, 24.0, 21.0, 7.0, 9.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-5.597845554351807, -5.423863887786865, -5.249881744384766, -5.075900077819824, -4.901918411254883, -4.727936267852783, -4.553954601287842, -4.379972457885742, -4.205990791320801, -4.032009124755859, -3.8580269813537598, -3.6840453147888184, -3.510063409805298, -3.3360815048217773, -3.162099838256836, -2.9881179332733154, -2.814136028289795, -2.6401541233062744, -2.466172218322754, -2.2921905517578125, -2.118208646774292, -1.9442267417907715, -1.7702449560165405, -1.5962631702423096, -1.422281265258789, -1.2482993602752686, -1.0743175745010376, -0.9003357291221619, -0.7263538837432861, -0.5523720383644104, -0.37839019298553467, -0.2044084072113037, -0.030426025390625, 0.14355581998825073, 0.31753766536712646, 0.4915195107460022, 0.6655013561248779, 0.8394832015037537, 1.0134650468826294, 1.1874468326568604, 1.3614287376403809, 1.5354106426239014, 1.7093924283981323, 1.8833742141723633, 2.057356119155884, 2.2313380241394043, 2.4053196907043457, 2.579301595687866, 2.7532835006713867, 2.9272654056549072, 3.1012473106384277, 3.275228977203369, 3.4492108821868896, 3.62319278717041, 3.7971744537353516, 3.971156358718872, 4.145138263702393, 4.319119930267334, 4.493102073669434, 4.667083740234375, 4.841065406799316, 5.015047550201416, 5.189029216766357, 5.363011360168457, 5.536993026733398]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 12.0, 21.0, 20.0, 25.0, 34.0, 44.0, 60.0, 91.0, 167.0, 203.0, 298.0, 432.0, 665.0, 1097.0, 1671.0, 2571.0, 4147.0, 6580.0, 10538.0, 16909.0, 27930.0, 47142.0, 77461.0, 123081.0, 172608.0, 181234.0, 140155.0, 91363.0, 55394.0, 33245.0, 19924.0, 12258.0, 7746.0, 4854.0, 2998.0, 1883.0, 1210.0, 850.0, 510.0, 351.0, 219.0, 149.0, 122.0, 66.0, 59.0, 46.0, 31.0, 25.0, 17.0, 11.0, 7.0, 8.0, 3.0, 3.0, 5.0], "bins": [-1.6572265625, -1.6087188720703125, -1.560211181640625, -1.5117034912109375, -1.46319580078125, -1.4146881103515625, -1.366180419921875, -1.3176727294921875, -1.2691650390625, -1.2206573486328125, -1.172149658203125, -1.1236419677734375, -1.07513427734375, -1.0266265869140625, -0.978118896484375, -0.9296112060546875, -0.881103515625, -0.8325958251953125, -0.784088134765625, -0.7355804443359375, -0.68707275390625, -0.6385650634765625, -0.590057373046875, -0.5415496826171875, -0.4930419921875, -0.4445343017578125, -0.396026611328125, -0.3475189208984375, -0.29901123046875, -0.2505035400390625, -0.201995849609375, -0.1534881591796875, -0.10498046875, -0.0564727783203125, -0.007965087890625, 0.0405426025390625, 0.08905029296875, 0.1375579833984375, 0.186065673828125, 0.2345733642578125, 0.2830810546875, 0.3315887451171875, 0.380096435546875, 0.4286041259765625, 0.47711181640625, 0.5256195068359375, 0.574127197265625, 0.6226348876953125, 0.671142578125, 0.7196502685546875, 0.768157958984375, 0.8166656494140625, 0.86517333984375, 0.9136810302734375, 0.962188720703125, 1.0106964111328125, 1.0592041015625, 1.1077117919921875, 1.156219482421875, 1.2047271728515625, 1.25323486328125, 1.3017425537109375, 1.350250244140625, 1.3987579345703125, 1.447265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 9.0, 4.0, 9.0, 13.0, 6.0, 18.0, 18.0, 20.0, 30.0, 37.0, 19.0, 38.0, 34.0, 27.0, 46.0, 30.0, 56.0, 38.0, 55.0, 59.0, 40.0, 39.0, 33.0, 52.0, 35.0, 29.0, 31.0, 24.0, 20.0, 15.0, 24.0, 17.0, 27.0, 10.0, 8.0, 8.0, 10.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.03515625, -6.828125, -6.62109375, -6.4140625, -6.20703125, -6.0, -5.79296875, -5.5859375, -5.37890625, -5.171875, -4.96484375, -4.7578125, -4.55078125, -4.34375, -4.13671875, -3.9296875, -3.72265625, -3.515625, -3.30859375, -3.1015625, -2.89453125, -2.6875, -2.48046875, -2.2734375, -2.06640625, -1.859375, -1.65234375, -1.4453125, -1.23828125, -1.03125, -0.82421875, -0.6171875, -0.41015625, -0.203125, 0.00390625, 0.2109375, 0.41796875, 0.625, 0.83203125, 1.0390625, 1.24609375, 1.453125, 1.66015625, 1.8671875, 2.07421875, 2.28125, 2.48828125, 2.6953125, 2.90234375, 3.109375, 3.31640625, 3.5234375, 3.73046875, 3.9375, 4.14453125, 4.3515625, 4.55859375, 4.765625, 4.97265625, 5.1796875, 5.38671875, 5.59375, 5.80078125, 6.0078125, 6.21484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 7.0, 11.0, 12.0, 21.0, 27.0, 13.0, 37.0, 50.0, 65.0, 80.0, 104.0, 178.0, 256.0, 394.0, 552.0, 904.0, 1504.0, 2513.0, 4656.0, 8168.0, 15901.0, 32669.0, 420465.0, 489921.0, 34010.0, 16089.0, 8493.0, 4517.0, 2585.0, 1610.0, 994.0, 559.0, 368.0, 248.0, 160.0, 96.0, 81.0, 60.0, 41.0, 28.0, 17.0, 15.0, 20.0, 9.0, 8.0, 9.0, 4.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.0625, -4.9091796875, -4.755859375, -4.6025390625, -4.44921875, -4.2958984375, -4.142578125, -3.9892578125, -3.8359375, -3.6826171875, -3.529296875, -3.3759765625, -3.22265625, -3.0693359375, -2.916015625, -2.7626953125, -2.609375, -2.4560546875, -2.302734375, -2.1494140625, -1.99609375, -1.8427734375, -1.689453125, -1.5361328125, -1.3828125, -1.2294921875, -1.076171875, -0.9228515625, -0.76953125, -0.6162109375, -0.462890625, -0.3095703125, -0.15625, -0.0029296875, 0.150390625, 0.3037109375, 0.45703125, 0.6103515625, 0.763671875, 0.9169921875, 1.0703125, 1.2236328125, 1.376953125, 1.5302734375, 1.68359375, 1.8369140625, 1.990234375, 2.1435546875, 2.296875, 2.4501953125, 2.603515625, 2.7568359375, 2.91015625, 3.0634765625, 3.216796875, 3.3701171875, 3.5234375, 3.6767578125, 3.830078125, 3.9833984375, 4.13671875, 4.2900390625, 4.443359375, 4.5966796875, 4.75]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 10.0, 8.0, 11.0, 6.0, 16.0, 20.0, 19.0, 30.0, 26.0, 35.0, 31.0, 25.0, 38.0, 42.0, 49.0, 39.0, 39.0, 45.0, 51.0, 42.0, 42.0, 44.0, 40.0, 35.0, 36.0, 34.0, 26.0, 17.0, 32.0, 18.0, 18.0, 12.0, 11.0, 10.0, 4.0, 10.0, 6.0, 5.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9296875, -4.78515625, -4.640625, -4.49609375, -4.3515625, -4.20703125, -4.0625, -3.91796875, -3.7734375, -3.62890625, -3.484375, -3.33984375, -3.1953125, -3.05078125, -2.90625, -2.76171875, -2.6171875, -2.47265625, -2.328125, -2.18359375, -2.0390625, -1.89453125, -1.75, -1.60546875, -1.4609375, -1.31640625, -1.171875, -1.02734375, -0.8828125, -0.73828125, -0.59375, -0.44921875, -0.3046875, -0.16015625, -0.015625, 0.12890625, 0.2734375, 0.41796875, 0.5625, 0.70703125, 0.8515625, 0.99609375, 1.140625, 1.28515625, 1.4296875, 1.57421875, 1.71875, 1.86328125, 2.0078125, 2.15234375, 2.296875, 2.44140625, 2.5859375, 2.73046875, 2.875, 3.01953125, 3.1640625, 3.30859375, 3.453125, 3.59765625, 3.7421875, 3.88671875, 4.03125, 4.17578125, 4.3203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 15.0, 21.0, 19.0, 23.0, 36.0, 50.0, 86.0, 110.0, 165.0, 215.0, 309.0, 484.0, 696.0, 1096.0, 1769.0, 3096.0, 5531.0, 11253.0, 26089.0, 157495.0, 765778.0, 41108.0, 15573.0, 7450.0, 3937.0, 2227.0, 1348.0, 863.0, 501.0, 339.0, 241.0, 204.0, 122.0, 94.0, 54.0, 31.0, 36.0, 32.0, 14.0, 7.0, 10.0, 6.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.488037109375, -0.4724006652832031, -0.45676422119140625, -0.4411277770996094, -0.4254913330078125, -0.4098548889160156, -0.39421844482421875, -0.3785820007324219, -0.362945556640625, -0.3473091125488281, -0.33167266845703125, -0.3160362243652344, -0.3003997802734375, -0.2847633361816406, -0.26912689208984375, -0.2534904479980469, -0.23785400390625, -0.22221755981445312, -0.20658111572265625, -0.19094467163085938, -0.1753082275390625, -0.15967178344726562, -0.14403533935546875, -0.12839889526367188, -0.112762451171875, -0.09712600708007812, -0.08148956298828125, -0.06585311889648438, -0.0502166748046875, -0.034580230712890625, -0.01894378662109375, -0.003307342529296875, 0.0123291015625, 0.027965545654296875, 0.04360198974609375, 0.059238433837890625, 0.0748748779296875, 0.09051132202148438, 0.10614776611328125, 0.12178421020507812, 0.137420654296875, 0.15305709838867188, 0.16869354248046875, 0.18432998657226562, 0.1999664306640625, 0.21560287475585938, 0.23123931884765625, 0.24687576293945312, 0.26251220703125, 0.2781486511230469, 0.29378509521484375, 0.3094215393066406, 0.3250579833984375, 0.3406944274902344, 0.35633087158203125, 0.3719673156738281, 0.387603759765625, 0.4032402038574219, 0.41887664794921875, 0.4345130920410156, 0.4501495361328125, 0.4657859802246094, 0.48142242431640625, 0.4970588684082031, 0.5126953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 1.0, 7.0, 3.0, 8.0, 5.0, 9.0, 20.0, 12.0, 25.0, 32.0, 20.0, 36.0, 51.0, 53.0, 42.0, 68.0, 74.0, 70.0, 53.0, 67.0, 43.0, 47.0, 53.0, 37.0, 28.0, 22.0, 32.0, 17.0, 17.0, 15.0, 5.0, 5.0, 3.0, 10.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5272369384765625e-05, -2.4477019906044006e-05, -2.3681670427322388e-05, -2.288632094860077e-05, -2.209097146987915e-05, -2.1295621991157532e-05, -2.0500272512435913e-05, -1.9704923033714294e-05, -1.8909573554992676e-05, -1.8114224076271057e-05, -1.731887459754944e-05, -1.652352511882782e-05, -1.57281756401062e-05, -1.4932826161384583e-05, -1.4137476682662964e-05, -1.3342127203941345e-05, -1.2546777725219727e-05, -1.1751428246498108e-05, -1.095607876777649e-05, -1.016072928905487e-05, -9.365379810333252e-06, -8.570030331611633e-06, -7.774680852890015e-06, -6.979331374168396e-06, -6.183981895446777e-06, -5.388632416725159e-06, -4.59328293800354e-06, -3.7979334592819214e-06, -3.0025839805603027e-06, -2.207234501838684e-06, -1.4118850231170654e-06, -6.165355443954468e-07, 1.7881393432617188e-07, 9.741634130477905e-07, 1.7695128917694092e-06, 2.564862370491028e-06, 3.3602118492126465e-06, 4.155561327934265e-06, 4.950910806655884e-06, 5.7462602853775024e-06, 6.541609764099121e-06, 7.33695924282074e-06, 8.132308721542358e-06, 8.927658200263977e-06, 9.723007678985596e-06, 1.0518357157707214e-05, 1.1313706636428833e-05, 1.2109056115150452e-05, 1.290440559387207e-05, 1.3699755072593689e-05, 1.4495104551315308e-05, 1.5290454030036926e-05, 1.6085803508758545e-05, 1.6881152987480164e-05, 1.7676502466201782e-05, 1.84718519449234e-05, 1.926720142364502e-05, 2.0062550902366638e-05, 2.0857900381088257e-05, 2.1653249859809875e-05, 2.2448599338531494e-05, 2.3243948817253113e-05, 2.403929829597473e-05, 2.483464777469635e-05, 2.562999725341797e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 10.0, 13.0, 25.0, 25.0, 44.0, 68.0, 105.0, 168.0, 258.0, 380.0, 558.0, 839.0, 1374.0, 2024.0, 3166.0, 5059.0, 7583.0, 11755.0, 18791.0, 31106.0, 52840.0, 95719.0, 163047.0, 216773.0, 178001.0, 107298.0, 59574.0, 34667.0, 20934.0, 12821.0, 8211.0, 5422.0, 3460.0, 2211.0, 1458.0, 911.0, 584.0, 411.0, 280.0, 197.0, 121.0, 80.0, 42.0, 42.0, 27.0, 12.0, 20.0, 19.0, 3.0, 3.0, 10.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.4501953125, -0.4363861083984375, -0.422576904296875, -0.4087677001953125, -0.39495849609375, -0.3811492919921875, -0.367340087890625, -0.3535308837890625, -0.3397216796875, -0.3259124755859375, -0.312103271484375, -0.2982940673828125, -0.28448486328125, -0.2706756591796875, -0.256866455078125, -0.2430572509765625, -0.229248046875, -0.2154388427734375, -0.201629638671875, -0.1878204345703125, -0.17401123046875, -0.1602020263671875, -0.146392822265625, -0.1325836181640625, -0.1187744140625, -0.1049652099609375, -0.091156005859375, -0.0773468017578125, -0.06353759765625, -0.0497283935546875, -0.035919189453125, -0.0221099853515625, -0.00830078125, 0.0055084228515625, 0.019317626953125, 0.0331268310546875, 0.04693603515625, 0.0607452392578125, 0.074554443359375, 0.0883636474609375, 0.1021728515625, 0.1159820556640625, 0.129791259765625, 0.1436004638671875, 0.15740966796875, 0.1712188720703125, 0.185028076171875, 0.1988372802734375, 0.212646484375, 0.2264556884765625, 0.240264892578125, 0.2540740966796875, 0.26788330078125, 0.2816925048828125, 0.295501708984375, 0.3093109130859375, 0.3231201171875, 0.3369293212890625, 0.350738525390625, 0.3645477294921875, 0.37835693359375, 0.3921661376953125, 0.405975341796875, 0.4197845458984375, 0.43359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 6.0, 4.0, 10.0, 11.0, 22.0, 18.0, 21.0, 21.0, 36.0, 37.0, 29.0, 31.0, 60.0, 61.0, 70.0, 68.0, 69.0, 70.0, 60.0, 47.0, 38.0, 38.0, 19.0, 27.0, 26.0, 14.0, 17.0, 16.0, 10.0, 9.0, 7.0, 5.0, 4.0, 2.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.15761756896972656, -0.15227127075195312, -0.1469249725341797, -0.14157867431640625, -0.1362323760986328, -0.13088607788085938, -0.12553977966308594, -0.1201934814453125, -0.11484718322753906, -0.10950088500976562, -0.10415458679199219, -0.09880828857421875, -0.09346199035644531, -0.08811569213867188, -0.08276939392089844, -0.077423095703125, -0.07207679748535156, -0.06673049926757812, -0.06138420104980469, -0.05603790283203125, -0.05069160461425781, -0.045345306396484375, -0.03999900817871094, -0.0346527099609375, -0.029306411743164062, -0.023960113525390625, -0.018613815307617188, -0.01326751708984375, -0.007921218872070312, -0.002574920654296875, 0.0027713775634765625, 0.00811767578125, 0.013463973999023438, 0.018810272216796875, 0.024156570434570312, 0.02950286865234375, 0.03484916687011719, 0.040195465087890625, 0.04554176330566406, 0.0508880615234375, 0.05623435974121094, 0.061580657958984375, 0.06692695617675781, 0.07227325439453125, 0.07761955261230469, 0.08296585083007812, 0.08831214904785156, 0.093658447265625, 0.09900474548339844, 0.10435104370117188, 0.10969734191894531, 0.11504364013671875, 0.12038993835449219, 0.12573623657226562, 0.13108253479003906, 0.1364288330078125, 0.14177513122558594, 0.14712142944335938, 0.1524677276611328, 0.15781402587890625, 0.1631603240966797, 0.16850662231445312, 0.17385292053222656, 0.17919921875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 7.0, 13.0, 15.0, 19.0, 20.0, 27.0, 25.0, 41.0, 47.0, 48.0, 45.0, 50.0, 56.0, 57.0, 60.0, 59.0, 67.0, 51.0, 44.0, 49.0, 49.0, 30.0, 26.0, 18.0, 13.0, 7.0, 11.0, 13.0, 9.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.190295696258545, -6.9590349197387695, -6.727774620056152, -6.496514320373535, -6.26525354385376, -6.033992767333984, -5.802732467651367, -5.57147216796875, -5.340211391448975, -5.108950614929199, -4.877690315246582, -4.646430015563965, -4.4151692390441895, -4.183908462524414, -3.952648162841797, -3.7213876247406006, -3.4901270866394043, -3.258866548538208, -3.0276060104370117, -2.7963454723358154, -2.565084934234619, -2.333824396133423, -2.1025638580322266, -1.8713033199310303, -1.640042781829834, -1.4087822437286377, -1.1775217056274414, -0.9462611675262451, -0.7150006294250488, -0.48374009132385254, -0.25247955322265625, -0.02121901512145996, 0.21004199981689453, 0.4413025379180908, 0.6725630760192871, 0.9038236141204834, 1.1350841522216797, 1.366344690322876, 1.5976052284240723, 1.8288657665252686, 2.060126304626465, 2.291386842727661, 2.5226473808288574, 2.7539079189300537, 2.98516845703125, 3.2164289951324463, 3.4476895332336426, 3.678950071334839, 3.910210609436035, 4.141470909118652, 4.372731685638428, 4.603992462158203, 4.83525276184082, 5.0665130615234375, 5.297773838043213, 5.529034614562988, 5.7602949142456055, 5.991555213928223, 6.222815990447998, 6.454076766967773, 6.685337066650391, 6.916597366333008, 7.147858142852783, 7.379118919372559, 7.610379219055176]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 11.0, 4.0, 6.0, 18.0, 12.0, 24.0, 16.0, 26.0, 23.0, 27.0, 24.0, 27.0, 30.0, 38.0, 27.0, 32.0, 46.0, 31.0, 49.0, 39.0, 37.0, 39.0, 39.0, 44.0, 34.0, 37.0, 36.0, 23.0, 15.0, 21.0, 18.0, 28.0, 19.0, 21.0, 16.0, 14.0, 7.0, 4.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.641003608703613, -5.4663920402526855, -5.291780948638916, -5.117169380187988, -4.9425578117370605, -4.767946720123291, -4.593335151672363, -4.418724060058594, -4.244112491607666, -4.069500923156738, -3.8948895931243896, -3.720278263092041, -3.5456669330596924, -3.3710556030273438, -3.196444034576416, -3.0218327045440674, -2.8472211360931396, -2.672609806060791, -2.4979982376098633, -2.3233869075775146, -2.148775577545166, -1.9741641283035278, -1.7995526790618896, -1.624941349029541, -1.4503298997879028, -1.2757184505462646, -1.101107120513916, -0.9264956712722778, -0.7518842816352844, -0.577272891998291, -0.40266144275665283, -0.2280501127243042, -0.053438663482666016, 0.12117274105548859, 0.2957841455936432, 0.470395565032959, 0.6450069546699524, 0.8196183443069458, 0.994229793548584, 1.1688411235809326, 1.3434525728225708, 1.518064022064209, 1.6926753520965576, 1.8672868013381958, 2.041898250579834, 2.2165095806121826, 2.3911209106445312, 2.565732479095459, 2.7403438091278076, 2.9149551391601562, 3.089566707611084, 3.2641780376434326, 3.4387893676757812, 3.613400936126709, 3.7880122661590576, 3.9626235961914062, 4.137235164642334, 4.311846733093262, 4.486457824707031, 4.661069393157959, 4.835680961608887, 5.010292053222656, 5.184903621673584, 5.359515190124512, 5.534126281738281]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 11.0, 25.0, 37.0, 52.0, 69.0, 107.0, 169.0, 227.0, 355.0, 493.0, 696.0, 1038.0, 1469.0, 2227.0, 3347.0, 4893.0, 7466.0, 10678.0, 15861.0, 23641.0, 34064.0, 49443.0, 68513.0, 90151.0, 109459.0, 120339.0, 117991.0, 103245.0, 82443.0, 61565.0, 43704.0, 30425.0, 20978.0, 13976.0, 9516.0, 6433.0, 4364.0, 2899.0, 1989.0, 1360.0, 907.0, 628.0, 402.0, 304.0, 193.0, 129.0, 95.0, 58.0, 38.0, 29.0, 21.0, 8.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.955078125, -3.830841064453125, -3.70660400390625, -3.582366943359375, -3.4581298828125, -3.333892822265625, -3.20965576171875, -3.085418701171875, -2.961181640625, -2.836944580078125, -2.71270751953125, -2.588470458984375, -2.4642333984375, -2.339996337890625, -2.21575927734375, -2.091522216796875, -1.96728515625, -1.843048095703125, -1.71881103515625, -1.594573974609375, -1.4703369140625, -1.346099853515625, -1.22186279296875, -1.097625732421875, -0.973388671875, -0.849151611328125, -0.72491455078125, -0.600677490234375, -0.4764404296875, -0.352203369140625, -0.22796630859375, -0.103729248046875, 0.0205078125, 0.144744873046875, 0.26898193359375, 0.393218994140625, 0.5174560546875, 0.641693115234375, 0.76593017578125, 0.890167236328125, 1.014404296875, 1.138641357421875, 1.26287841796875, 1.387115478515625, 1.5113525390625, 1.635589599609375, 1.75982666015625, 1.884063720703125, 2.00830078125, 2.132537841796875, 2.25677490234375, 2.381011962890625, 2.5052490234375, 2.629486083984375, 2.75372314453125, 2.877960205078125, 3.002197265625, 3.126434326171875, 3.25067138671875, 3.374908447265625, 3.4991455078125, 3.623382568359375, 3.74761962890625, 3.871856689453125, 3.99609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 2.0, 2.0, 8.0, 13.0, 10.0, 13.0, 15.0, 16.0, 21.0, 17.0, 20.0, 16.0, 30.0, 36.0, 28.0, 32.0, 25.0, 34.0, 34.0, 35.0, 39.0, 34.0, 36.0, 42.0, 47.0, 39.0, 35.0, 34.0, 38.0, 28.0, 31.0, 20.0, 26.0, 24.0, 18.0, 11.0, 19.0, 13.0, 12.0, 10.0, 6.0, 12.0, 6.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-5.9609375, -5.78546142578125, -5.6099853515625, -5.43450927734375, -5.259033203125, -5.08355712890625, -4.9080810546875, -4.73260498046875, -4.55712890625, -4.38165283203125, -4.2061767578125, -4.03070068359375, -3.855224609375, -3.67974853515625, -3.5042724609375, -3.32879638671875, -3.1533203125, -2.97784423828125, -2.8023681640625, -2.62689208984375, -2.451416015625, -2.27593994140625, -2.1004638671875, -1.92498779296875, -1.74951171875, -1.57403564453125, -1.3985595703125, -1.22308349609375, -1.047607421875, -0.87213134765625, -0.6966552734375, -0.52117919921875, -0.345703125, -0.17022705078125, 0.0052490234375, 0.18072509765625, 0.356201171875, 0.53167724609375, 0.7071533203125, 0.88262939453125, 1.05810546875, 1.23358154296875, 1.4090576171875, 1.58453369140625, 1.760009765625, 1.93548583984375, 2.1109619140625, 2.28643798828125, 2.4619140625, 2.63739013671875, 2.8128662109375, 2.98834228515625, 3.163818359375, 3.33929443359375, 3.5147705078125, 3.69024658203125, 3.86572265625, 4.04119873046875, 4.2166748046875, 4.39215087890625, 4.567626953125, 4.74310302734375, 4.9185791015625, 5.09405517578125, 5.26953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 13.0, 22.0, 30.0, 36.0, 75.0, 148.0, 229.0, 405.0, 710.0, 1218.0, 2191.0, 4072.0, 7926.0, 15202.0, 29687.0, 57120.0, 102684.0, 162123.0, 200741.0, 183630.0, 126369.0, 73062.0, 38701.0, 19991.0, 10369.0, 5265.0, 2895.0, 1581.0, 887.0, 482.0, 283.0, 156.0, 85.0, 49.0, 39.0, 21.0, 17.0, 6.0, 8.0, 4.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.8548583984375, -6.631591796875, -6.4083251953125, -6.18505859375, -5.9617919921875, -5.738525390625, -5.5152587890625, -5.2919921875, -5.0687255859375, -4.845458984375, -4.6221923828125, -4.39892578125, -4.1756591796875, -3.952392578125, -3.7291259765625, -3.505859375, -3.2825927734375, -3.059326171875, -2.8360595703125, -2.61279296875, -2.3895263671875, -2.166259765625, -1.9429931640625, -1.7197265625, -1.4964599609375, -1.273193359375, -1.0499267578125, -0.82666015625, -0.6033935546875, -0.380126953125, -0.1568603515625, 0.06640625, 0.2896728515625, 0.512939453125, 0.7362060546875, 0.95947265625, 1.1827392578125, 1.406005859375, 1.6292724609375, 1.8525390625, 2.0758056640625, 2.299072265625, 2.5223388671875, 2.74560546875, 2.9688720703125, 3.192138671875, 3.4154052734375, 3.638671875, 3.8619384765625, 4.085205078125, 4.3084716796875, 4.53173828125, 4.7550048828125, 4.978271484375, 5.2015380859375, 5.4248046875, 5.6480712890625, 5.871337890625, 6.0946044921875, 6.31787109375, 6.5411376953125, 6.764404296875, 6.9876708984375, 7.2109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 15.0, 18.0, 20.0, 20.0, 33.0, 32.0, 34.0, 45.0, 35.0, 43.0, 48.0, 46.0, 52.0, 58.0, 46.0, 58.0, 41.0, 51.0, 38.0, 45.0, 39.0, 33.0, 20.0, 22.0, 20.0, 13.0, 13.0, 9.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.12109375, -4.97491455078125, -4.8287353515625, -4.68255615234375, -4.536376953125, -4.39019775390625, -4.2440185546875, -4.09783935546875, -3.95166015625, -3.80548095703125, -3.6593017578125, -3.51312255859375, -3.366943359375, -3.22076416015625, -3.0745849609375, -2.92840576171875, -2.7822265625, -2.63604736328125, -2.4898681640625, -2.34368896484375, -2.197509765625, -2.05133056640625, -1.9051513671875, -1.75897216796875, -1.61279296875, -1.46661376953125, -1.3204345703125, -1.17425537109375, -1.028076171875, -0.88189697265625, -0.7357177734375, -0.58953857421875, -0.443359375, -0.29718017578125, -0.1510009765625, -0.00482177734375, 0.141357421875, 0.28753662109375, 0.4337158203125, 0.57989501953125, 0.72607421875, 0.87225341796875, 1.0184326171875, 1.16461181640625, 1.310791015625, 1.45697021484375, 1.6031494140625, 1.74932861328125, 1.8955078125, 2.04168701171875, 2.1878662109375, 2.33404541015625, 2.480224609375, 2.62640380859375, 2.7725830078125, 2.91876220703125, 3.06494140625, 3.21112060546875, 3.3572998046875, 3.50347900390625, 3.649658203125, 3.79583740234375, 3.9420166015625, 4.08819580078125, 4.234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 7.0, 15.0, 21.0, 25.0, 31.0, 55.0, 76.0, 140.0, 202.0, 299.0, 455.0, 764.0, 1284.0, 2135.0, 3677.0, 6155.0, 10652.0, 18452.0, 31710.0, 51895.0, 81941.0, 117265.0, 146576.0, 155428.0, 138335.0, 104726.0, 70227.0, 43600.0, 25784.0, 15084.0, 8752.0, 5124.0, 2998.0, 1753.0, 1135.0, 673.0, 374.0, 250.0, 178.0, 75.0, 73.0, 56.0, 31.0, 31.0, 18.0, 9.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7080078125, -1.653472900390625, -1.59893798828125, -1.544403076171875, -1.4898681640625, -1.435333251953125, -1.38079833984375, -1.326263427734375, -1.271728515625, -1.217193603515625, -1.16265869140625, -1.108123779296875, -1.0535888671875, -0.999053955078125, -0.94451904296875, -0.889984130859375, -0.83544921875, -0.780914306640625, -0.72637939453125, -0.671844482421875, -0.6173095703125, -0.562774658203125, -0.50823974609375, -0.453704833984375, -0.399169921875, -0.344635009765625, -0.29010009765625, -0.235565185546875, -0.1810302734375, -0.126495361328125, -0.07196044921875, -0.017425537109375, 0.037109375, 0.091644287109375, 0.14617919921875, 0.200714111328125, 0.2552490234375, 0.309783935546875, 0.36431884765625, 0.418853759765625, 0.473388671875, 0.527923583984375, 0.58245849609375, 0.636993408203125, 0.6915283203125, 0.746063232421875, 0.80059814453125, 0.855133056640625, 0.90966796875, 0.964202880859375, 1.01873779296875, 1.073272705078125, 1.1278076171875, 1.182342529296875, 1.23687744140625, 1.291412353515625, 1.345947265625, 1.400482177734375, 1.45501708984375, 1.509552001953125, 1.5640869140625, 1.618621826171875, 1.67315673828125, 1.727691650390625, 1.7822265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 16.0, 13.0, 21.0, 15.0, 29.0, 27.0, 43.0, 40.0, 45.0, 42.0, 46.0, 60.0, 67.0, 72.0, 51.0, 66.0, 56.0, 46.0, 46.0, 43.0, 34.0, 17.0, 16.0, 28.0, 19.0, 12.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001989603042602539, -0.00019226036965847015, -0.0001855604350566864, -0.00017886050045490265, -0.0001721605658531189, -0.00016546063125133514, -0.0001587606966495514, -0.00015206076204776764, -0.0001453608274459839, -0.00013866089284420013, -0.00013196095824241638, -0.00012526102364063263, -0.00011856108903884888, -0.00011186115443706512, -0.00010516121983528137, -9.846128523349762e-05, -9.176135063171387e-05, -8.506141602993011e-05, -7.836148142814636e-05, -7.166154682636261e-05, -6.496161222457886e-05, -5.8261677622795105e-05, -5.156174302101135e-05, -4.48618084192276e-05, -3.816187381744385e-05, -3.1461939215660095e-05, -2.4762004613876343e-05, -1.806207001209259e-05, -1.1362135410308838e-05, -4.6622008085250854e-06, 2.037733793258667e-06, 8.73766839504242e-06, 1.5437602996826172e-05, 2.2137537598609924e-05, 2.8837472200393677e-05, 3.553740680217743e-05, 4.223734140396118e-05, 4.8937276005744934e-05, 5.5637210607528687e-05, 6.233714520931244e-05, 6.903707981109619e-05, 7.573701441287994e-05, 8.24369490146637e-05, 8.913688361644745e-05, 9.58368182182312e-05, 0.00010253675282001495, 0.0001092366874217987, 0.00011593662202358246, 0.0001226365566253662, 0.00012933649122714996, 0.00013603642582893372, 0.00014273636043071747, 0.00014943629503250122, 0.00015613622963428497, 0.00016283616423606873, 0.00016953609883785248, 0.00017623603343963623, 0.00018293596804141998, 0.00018963590264320374, 0.0001963358372449875, 0.00020303577184677124, 0.000209735706448555, 0.00021643564105033875, 0.0002231355756521225, 0.00022983551025390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 11.0, 13.0, 18.0, 9.0, 25.0, 53.0, 59.0, 85.0, 134.0, 174.0, 313.0, 431.0, 649.0, 993.0, 1488.0, 2272.0, 3510.0, 5728.0, 9176.0, 14600.0, 23583.0, 37281.0, 56714.0, 81953.0, 108902.0, 130272.0, 136296.0, 124041.0, 100628.0, 72994.0, 49748.0, 32130.0, 20106.0, 12657.0, 7822.0, 4852.0, 3009.0, 1951.0, 1270.0, 855.0, 549.0, 383.0, 281.0, 151.0, 115.0, 85.0, 48.0, 29.0, 40.0, 19.0, 17.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0], "bins": [-1.6044921875, -1.55487060546875, -1.5052490234375, -1.45562744140625, -1.406005859375, -1.35638427734375, -1.3067626953125, -1.25714111328125, -1.20751953125, -1.15789794921875, -1.1082763671875, -1.05865478515625, -1.009033203125, -0.95941162109375, -0.9097900390625, -0.86016845703125, -0.810546875, -0.76092529296875, -0.7113037109375, -0.66168212890625, -0.612060546875, -0.56243896484375, -0.5128173828125, -0.46319580078125, -0.41357421875, -0.36395263671875, -0.3143310546875, -0.26470947265625, -0.215087890625, -0.16546630859375, -0.1158447265625, -0.06622314453125, -0.0166015625, 0.03302001953125, 0.0826416015625, 0.13226318359375, 0.181884765625, 0.23150634765625, 0.2811279296875, 0.33074951171875, 0.38037109375, 0.42999267578125, 0.4796142578125, 0.52923583984375, 0.578857421875, 0.62847900390625, 0.6781005859375, 0.72772216796875, 0.77734375, 0.82696533203125, 0.8765869140625, 0.92620849609375, 0.975830078125, 1.02545166015625, 1.0750732421875, 1.12469482421875, 1.17431640625, 1.22393798828125, 1.2735595703125, 1.32318115234375, 1.372802734375, 1.42242431640625, 1.4720458984375, 1.52166748046875, 1.5712890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 8.0, 10.0, 4.0, 11.0, 10.0, 18.0, 19.0, 17.0, 28.0, 30.0, 40.0, 41.0, 52.0, 53.0, 73.0, 57.0, 54.0, 62.0, 51.0, 47.0, 45.0, 43.0, 32.0, 31.0, 34.0, 29.0, 23.0, 20.0, 10.0, 9.0, 7.0, 10.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.87548828125, -0.8503570556640625, -0.825225830078125, -0.8000946044921875, -0.77496337890625, -0.7498321533203125, -0.724700927734375, -0.6995697021484375, -0.6744384765625, -0.6493072509765625, -0.624176025390625, -0.5990447998046875, -0.57391357421875, -0.5487823486328125, -0.523651123046875, -0.4985198974609375, -0.473388671875, -0.4482574462890625, -0.423126220703125, -0.3979949951171875, -0.37286376953125, -0.3477325439453125, -0.322601318359375, -0.2974700927734375, -0.2723388671875, -0.2472076416015625, -0.222076416015625, -0.1969451904296875, -0.17181396484375, -0.1466827392578125, -0.121551513671875, -0.0964202880859375, -0.0712890625, -0.0461578369140625, -0.021026611328125, 0.0041046142578125, 0.02923583984375, 0.0543670654296875, 0.079498291015625, 0.1046295166015625, 0.1297607421875, 0.1548919677734375, 0.180023193359375, 0.2051544189453125, 0.23028564453125, 0.2554168701171875, 0.280548095703125, 0.3056793212890625, 0.330810546875, 0.3559417724609375, 0.381072998046875, 0.4062042236328125, 0.43133544921875, 0.4564666748046875, 0.481597900390625, 0.5067291259765625, 0.5318603515625, 0.5569915771484375, 0.582122802734375, 0.6072540283203125, 0.63238525390625, 0.6575164794921875, 0.682647705078125, 0.7077789306640625, 0.73291015625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 14.0, 15.0, 24.0, 18.0, 21.0, 35.0, 33.0, 39.0, 28.0, 45.0, 42.0, 61.0, 61.0, 56.0, 53.0, 60.0, 51.0, 54.0, 49.0, 47.0, 35.0, 26.0, 21.0, 24.0, 13.0, 14.0, 8.0, 13.0, 10.0, 6.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.67264986038208, -6.455435276031494, -6.238221168518066, -6.0210065841674805, -5.803792476654053, -5.586577892303467, -5.369363784790039, -5.152149200439453, -4.934934616088867, -4.717720031738281, -4.5005059242248535, -4.283291339874268, -4.06607723236084, -3.848862648010254, -3.631648302078247, -3.4144339561462402, -3.1972198486328125, -2.9800055027008057, -2.762791156768799, -2.545576572418213, -2.328362464904785, -2.111147880554199, -1.8939335346221924, -1.6767191886901855, -1.4595048427581787, -1.2422904968261719, -1.025076150894165, -0.8078616857528687, -0.5906473398208618, -0.373432993888855, -0.1562185287475586, 0.06099581718444824, 0.2782106399536133, 0.4954250156879425, 0.7126393914222717, 0.9298537969589233, 1.1470681428909302, 1.364282488822937, 1.5814969539642334, 1.7987112998962402, 2.015925645828247, 2.233139991760254, 2.4503543376922607, 2.6675686836242676, 2.8847832679748535, 3.1019973754882812, 3.319211959838867, 3.536426305770874, 3.753640651702881, 3.9708549976348877, 4.1880693435668945, 4.4052839279174805, 4.622498035430908, 4.839712619781494, 5.056926727294922, 5.274141311645508, 5.491355895996094, 5.70857048034668, 5.925784587860107, 6.142999172210693, 6.360213279724121, 6.577427864074707, 6.794642448425293, 7.011856555938721, 7.229070663452148]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 2.0, 5.0, 6.0, 11.0, 10.0, 17.0, 11.0, 11.0, 21.0, 18.0, 28.0, 29.0, 32.0, 27.0, 30.0, 40.0, 37.0, 29.0, 31.0, 41.0, 33.0, 32.0, 43.0, 39.0, 38.0, 38.0, 35.0, 43.0, 31.0, 27.0, 27.0, 29.0, 23.0, 18.0, 22.0, 11.0, 14.0, 8.0, 16.0, 7.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0682783126831055, -4.888309001922607, -4.708339691162109, -4.5283708572387695, -4.3484015464782715, -4.168432235717773, -3.9884629249572754, -3.8084936141967773, -3.6285245418548584, -3.4485552310943604, -3.2685861587524414, -3.0886168479919434, -2.9086475372314453, -2.7286784648895264, -2.5487091541290283, -2.3687400817871094, -2.1887707710266113, -2.0088014602661133, -1.8288323879241943, -1.6488630771636963, -1.4688938856124878, -1.2889246940612793, -1.1089553833007812, -0.9289861917495728, -0.7490170001983643, -0.5690478086471558, -0.3890785574913025, -0.20910930633544922, -0.029140114784240723, 0.15082907676696777, 0.3307983875274658, 0.5107675790786743, 0.6907362937927246, 0.8707054853439331, 1.0506746768951416, 1.2306439876556396, 1.4106131792068481, 1.5905823707580566, 1.7705516815185547, 1.9505208730697632, 2.1304900646209717, 2.3104593753814697, 2.4904284477233887, 2.6703977584838867, 2.8503670692443848, 3.0303361415863037, 3.2103054523468018, 3.3902745246887207, 3.5702438354492188, 3.750213146209717, 3.9301822185516357, 4.110151290893555, 4.290120601654053, 4.470089912414551, 4.650059223175049, 4.830028533935547, 5.009997367858887, 5.189966678619385, 5.369935989379883, 5.549904823303223, 5.729874134063721, 5.909843444824219, 6.089812755584717, 6.269782066345215, 6.449751377105713]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 1.0, 7.0, 13.0, 7.0, 15.0, 28.0, 40.0, 55.0, 77.0, 155.0, 206.0, 308.0, 507.0, 759.0, 1172.0, 1824.0, 3114.0, 5179.0, 9084.0, 15587.0, 28683.0, 53550.0, 104031.0, 203652.0, 385191.0, 633642.0, 816363.0, 764612.0, 534350.0, 302389.0, 156496.0, 80137.0, 41096.0, 22288.0, 12090.0, 7008.0, 4141.0, 2472.0, 1469.0, 941.0, 552.0, 388.0, 220.0, 160.0, 73.0, 60.0, 40.0, 21.0, 17.0, 5.0, 4.0, 6.0, 1.0], "bins": [-6.9765625, -6.7919921875, -6.607421875, -6.4228515625, -6.23828125, -6.0537109375, -5.869140625, -5.6845703125, -5.5, -5.3154296875, -5.130859375, -4.9462890625, -4.76171875, -4.5771484375, -4.392578125, -4.2080078125, -4.0234375, -3.8388671875, -3.654296875, -3.4697265625, -3.28515625, -3.1005859375, -2.916015625, -2.7314453125, -2.546875, -2.3623046875, -2.177734375, -1.9931640625, -1.80859375, -1.6240234375, -1.439453125, -1.2548828125, -1.0703125, -0.8857421875, -0.701171875, -0.5166015625, -0.33203125, -0.1474609375, 0.037109375, 0.2216796875, 0.40625, 0.5908203125, 0.775390625, 0.9599609375, 1.14453125, 1.3291015625, 1.513671875, 1.6982421875, 1.8828125, 2.0673828125, 2.251953125, 2.4365234375, 2.62109375, 2.8056640625, 2.990234375, 3.1748046875, 3.359375, 3.5439453125, 3.728515625, 3.9130859375, 4.09765625, 4.2822265625, 4.466796875, 4.6513671875, 4.8359375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 3.0, 3.0, 5.0, 9.0, 11.0, 10.0, 9.0, 12.0, 26.0, 22.0, 33.0, 24.0, 34.0, 32.0, 31.0, 34.0, 35.0, 46.0, 36.0, 43.0, 39.0, 40.0, 45.0, 37.0, 39.0, 28.0, 33.0, 40.0, 31.0, 32.0, 25.0, 28.0, 16.0, 23.0, 18.0, 13.0, 8.0, 9.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.6763916015625, -4.509033203125, -4.3416748046875, -4.17431640625, -4.0069580078125, -3.839599609375, -3.6722412109375, -3.5048828125, -3.3375244140625, -3.170166015625, -3.0028076171875, -2.83544921875, -2.6680908203125, -2.500732421875, -2.3333740234375, -2.166015625, -1.9986572265625, -1.831298828125, -1.6639404296875, -1.49658203125, -1.3292236328125, -1.161865234375, -0.9945068359375, -0.8271484375, -0.6597900390625, -0.492431640625, -0.3250732421875, -0.15771484375, 0.0096435546875, 0.177001953125, 0.3443603515625, 0.51171875, 0.6790771484375, 0.846435546875, 1.0137939453125, 1.18115234375, 1.3485107421875, 1.515869140625, 1.6832275390625, 1.8505859375, 2.0179443359375, 2.185302734375, 2.3526611328125, 2.52001953125, 2.6873779296875, 2.854736328125, 3.0220947265625, 3.189453125, 3.3568115234375, 3.524169921875, 3.6915283203125, 3.85888671875, 4.0262451171875, 4.193603515625, 4.3609619140625, 4.5283203125, 4.6956787109375, 4.863037109375, 5.0303955078125, 5.19775390625, 5.3651123046875, 5.532470703125, 5.6998291015625, 5.8671875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 18.0, 12.0, 29.0, 56.0, 84.0, 113.0, 184.0, 270.0, 398.0, 658.0, 1077.0, 1733.0, 2892.0, 4662.0, 7853.0, 13054.0, 22573.0, 38574.0, 65918.0, 111394.0, 183980.0, 292783.0, 431968.0, 567637.0, 630353.0, 580241.0, 449899.0, 305397.0, 193569.0, 117679.0, 69429.0, 40451.0, 24171.0, 14095.0, 8375.0, 4862.0, 2966.0, 1832.0, 1110.0, 679.0, 432.0, 292.0, 183.0, 123.0, 79.0, 49.0, 30.0, 27.0, 10.0, 8.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.14617919921875, -4.9720458984375, -4.79791259765625, -4.623779296875, -4.44964599609375, -4.2755126953125, -4.10137939453125, -3.92724609375, -3.75311279296875, -3.5789794921875, -3.40484619140625, -3.230712890625, -3.05657958984375, -2.8824462890625, -2.70831298828125, -2.5341796875, -2.36004638671875, -2.1859130859375, -2.01177978515625, -1.837646484375, -1.66351318359375, -1.4893798828125, -1.31524658203125, -1.14111328125, -0.96697998046875, -0.7928466796875, -0.61871337890625, -0.444580078125, -0.27044677734375, -0.0963134765625, 0.07781982421875, 0.251953125, 0.42608642578125, 0.6002197265625, 0.77435302734375, 0.948486328125, 1.12261962890625, 1.2967529296875, 1.47088623046875, 1.64501953125, 1.81915283203125, 1.9932861328125, 2.16741943359375, 2.341552734375, 2.51568603515625, 2.6898193359375, 2.86395263671875, 3.0380859375, 3.21221923828125, 3.3863525390625, 3.56048583984375, 3.734619140625, 3.90875244140625, 4.0828857421875, 4.25701904296875, 4.43115234375, 4.60528564453125, 4.7794189453125, 4.95355224609375, 5.127685546875, 5.30181884765625, 5.4759521484375, 5.65008544921875, 5.82421875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 5.0, 2.0, 7.0, 12.0, 14.0, 24.0, 17.0, 43.0, 48.0, 36.0, 80.0, 77.0, 79.0, 100.0, 108.0, 145.0, 133.0, 152.0, 196.0, 189.0, 231.0, 235.0, 210.0, 214.0, 179.0, 204.0, 195.0, 169.0, 183.0, 140.0, 121.0, 89.0, 84.0, 75.0, 56.0, 37.0, 46.0, 34.0, 24.0, 13.0, 11.0, 14.0, 9.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 5.0], "bins": [-2.572265625, -2.50177001953125, -2.4312744140625, -2.36077880859375, -2.290283203125, -2.21978759765625, -2.1492919921875, -2.07879638671875, -2.00830078125, -1.93780517578125, -1.8673095703125, -1.79681396484375, -1.726318359375, -1.65582275390625, -1.5853271484375, -1.51483154296875, -1.4443359375, -1.37384033203125, -1.3033447265625, -1.23284912109375, -1.162353515625, -1.09185791015625, -1.0213623046875, -0.95086669921875, -0.88037109375, -0.80987548828125, -0.7393798828125, -0.66888427734375, -0.598388671875, -0.52789306640625, -0.4573974609375, -0.38690185546875, -0.31640625, -0.24591064453125, -0.1754150390625, -0.10491943359375, -0.034423828125, 0.03607177734375, 0.1065673828125, 0.17706298828125, 0.24755859375, 0.31805419921875, 0.3885498046875, 0.45904541015625, 0.529541015625, 0.60003662109375, 0.6705322265625, 0.74102783203125, 0.8115234375, 0.88201904296875, 0.9525146484375, 1.02301025390625, 1.093505859375, 1.16400146484375, 1.2344970703125, 1.30499267578125, 1.37548828125, 1.44598388671875, 1.5164794921875, 1.58697509765625, 1.657470703125, 1.72796630859375, 1.7984619140625, 1.86895751953125, 1.939453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 3.0, 9.0, 6.0, 11.0, 15.0, 14.0, 34.0, 20.0, 24.0, 25.0, 27.0, 37.0, 48.0, 61.0, 47.0, 52.0, 48.0, 64.0, 53.0, 68.0, 52.0, 43.0, 36.0, 36.0, 33.0, 25.0, 34.0, 18.0, 13.0, 12.0, 5.0, 11.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4954023361206055, -7.268186092376709, -7.040969371795654, -6.813753128051758, -6.586536884307861, -6.359320640563965, -6.13210391998291, -5.904887676239014, -5.677671432495117, -5.450455188751221, -5.223238468170166, -4.9960222244262695, -4.768805980682373, -4.541589736938477, -4.314373016357422, -4.087156772613525, -3.8599400520324707, -3.632723569869995, -3.4055073261260986, -3.178290843963623, -2.9510746002197266, -2.723858118057251, -2.4966416358947754, -2.269425392150879, -2.0422089099884033, -1.8149925470352173, -1.5877761840820312, -1.3605597019195557, -1.1333433389663696, -0.9061269760131836, -0.678910493850708, -0.451694130897522, -0.22447776794433594, 0.0027386248111724854, 0.2299550175666809, 0.4571714401245117, 0.6843878030776978, 0.9116041660308838, 1.1388206481933594, 1.3660370111465454, 1.5932533740997314, 1.8204697370529175, 2.0476861000061035, 2.274902582168579, 2.5021190643310547, 2.729335308074951, 2.9565517902374268, 3.1837682723999023, 3.410984516143799, 3.6382009983062744, 3.865417242050171, 4.0926337242126465, 4.319849967956543, 4.547066688537598, 4.774282932281494, 5.001499176025391, 5.228715896606445, 5.455932140350342, 5.6831488609313965, 5.910365104675293, 6.1375813484191895, 6.364797592163086, 6.592014312744141, 6.819230556488037, 7.046446800231934]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 14.0, 9.0, 15.0, 29.0, 17.0, 25.0, 31.0, 28.0, 33.0, 33.0, 42.0, 32.0, 36.0, 31.0, 44.0, 40.0, 40.0, 50.0, 42.0, 42.0, 37.0, 34.0, 44.0, 27.0, 28.0, 19.0, 27.0, 23.0, 18.0, 13.0, 14.0, 8.0, 11.0, 11.0, 8.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64896821975708, -5.4565300941467285, -5.264091491699219, -5.071653366088867, -4.879215240478516, -4.686776638031006, -4.494338512420654, -4.3018999099731445, -4.109461784362793, -3.9170234203338623, -3.7245850563049316, -3.53214693069458, -3.3397085666656494, -3.1472702026367188, -2.954832077026367, -2.7623937129974365, -2.569955348968506, -2.377516984939575, -2.1850786209106445, -1.992640495300293, -1.8002021312713623, -1.6077637672424316, -1.4153255224227905, -1.2228872776031494, -1.0304489135742188, -0.8380106091499329, -0.645572304725647, -0.4531340003013611, -0.2606956958770752, -0.0682573914527893, 0.12418091297149658, 0.3166191577911377, 0.5090570449829102, 0.701495349407196, 0.8939336538314819, 1.086371898651123, 1.2788102626800537, 1.4712486267089844, 1.6636868715286255, 1.8561251163482666, 2.0485634803771973, 2.241001844406128, 2.4334402084350586, 2.62587833404541, 2.818316698074341, 3.0107550621032715, 3.203193187713623, 3.3956315517425537, 3.5880699157714844, 3.780508279800415, 3.9729466438293457, 4.165384769439697, 4.357823371887207, 4.550261497497559, 4.74269962310791, 4.935137748718262, 5.1275763511657715, 5.320014476776123, 5.512453079223633, 5.704891204833984, 5.897329330444336, 6.089767932891846, 6.282206058502197, 6.474644660949707, 6.667082786560059]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 9.0, 10.0, 20.0, 20.0, 32.0, 45.0, 71.0, 94.0, 138.0, 190.0, 258.0, 347.0, 528.0, 729.0, 1112.0, 1513.0, 2152.0, 3115.0, 4413.0, 6428.0, 9296.0, 14306.0, 20843.0, 30665.0, 45335.0, 65410.0, 91592.0, 119871.0, 137404.0, 132008.0, 107452.0, 78947.0, 55470.0, 38044.0, 25313.0, 17516.0, 11843.0, 7960.0, 5633.0, 3706.0, 2591.0, 1849.0, 1217.0, 919.0, 585.0, 450.0, 325.0, 242.0, 152.0, 113.0, 73.0, 53.0, 51.0, 39.0, 23.0, 22.0, 10.0, 6.0, 2.0, 5.0, 3.0], "bins": [-0.88671875, -0.8588104248046875, -0.830902099609375, -0.8029937744140625, -0.77508544921875, -0.7471771240234375, -0.719268798828125, -0.6913604736328125, -0.6634521484375, -0.6355438232421875, -0.607635498046875, -0.5797271728515625, -0.55181884765625, -0.5239105224609375, -0.496002197265625, -0.4680938720703125, -0.440185546875, -0.4122772216796875, -0.384368896484375, -0.3564605712890625, -0.32855224609375, -0.3006439208984375, -0.272735595703125, -0.2448272705078125, -0.2169189453125, -0.1890106201171875, -0.161102294921875, -0.1331939697265625, -0.10528564453125, -0.0773773193359375, -0.049468994140625, -0.0215606689453125, 0.00634765625, 0.0342559814453125, 0.062164306640625, 0.0900726318359375, 0.11798095703125, 0.1458892822265625, 0.173797607421875, 0.2017059326171875, 0.2296142578125, 0.2575225830078125, 0.285430908203125, 0.3133392333984375, 0.34124755859375, 0.3691558837890625, 0.397064208984375, 0.4249725341796875, 0.452880859375, 0.4807891845703125, 0.508697509765625, 0.5366058349609375, 0.56451416015625, 0.5924224853515625, 0.620330810546875, 0.6482391357421875, 0.6761474609375, 0.7040557861328125, 0.731964111328125, 0.7598724365234375, 0.78778076171875, 0.8156890869140625, 0.843597412109375, 0.8715057373046875, 0.8994140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 2.0, 6.0, 6.0, 6.0, 10.0, 16.0, 13.0, 20.0, 18.0, 28.0, 29.0, 30.0, 29.0, 32.0, 38.0, 31.0, 25.0, 39.0, 45.0, 34.0, 46.0, 41.0, 42.0, 34.0, 47.0, 39.0, 40.0, 34.0, 30.0, 28.0, 23.0, 18.0, 25.0, 20.0, 9.0, 13.0, 14.0, 7.0, 8.0, 8.0, 1.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.29107666015625, -5.0938720703125, -4.89666748046875, -4.699462890625, -4.50225830078125, -4.3050537109375, -4.10784912109375, -3.91064453125, -3.71343994140625, -3.5162353515625, -3.31903076171875, -3.121826171875, -2.92462158203125, -2.7274169921875, -2.53021240234375, -2.3330078125, -2.13580322265625, -1.9385986328125, -1.74139404296875, -1.544189453125, -1.34698486328125, -1.1497802734375, -0.95257568359375, -0.75537109375, -0.55816650390625, -0.3609619140625, -0.16375732421875, 0.033447265625, 0.23065185546875, 0.4278564453125, 0.62506103515625, 0.822265625, 1.01947021484375, 1.2166748046875, 1.41387939453125, 1.611083984375, 1.80828857421875, 2.0054931640625, 2.20269775390625, 2.39990234375, 2.59710693359375, 2.7943115234375, 2.99151611328125, 3.188720703125, 3.38592529296875, 3.5831298828125, 3.78033447265625, 3.9775390625, 4.17474365234375, 4.3719482421875, 4.56915283203125, 4.766357421875, 4.96356201171875, 5.1607666015625, 5.35797119140625, 5.55517578125, 5.75238037109375, 5.9495849609375, 6.14678955078125, 6.343994140625, 6.54119873046875, 6.7384033203125, 6.93560791015625, 7.1328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 3.0, 8.0, 4.0, 7.0, 9.0, 9.0, 14.0, 15.0, 26.0, 22.0, 51.0, 58.0, 84.0, 131.0, 211.0, 346.0, 553.0, 837.0, 1577.0, 2831.0, 5469.0, 11267.0, 24858.0, 117955.0, 797689.0, 47892.0, 18086.0, 8608.0, 4245.0, 2256.0, 1285.0, 790.0, 439.0, 288.0, 193.0, 130.0, 92.0, 50.0, 38.0, 32.0, 30.0, 13.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.818359375, -3.6964111328125, -3.574462890625, -3.4525146484375, -3.33056640625, -3.2086181640625, -3.086669921875, -2.9647216796875, -2.8427734375, -2.7208251953125, -2.598876953125, -2.4769287109375, -2.35498046875, -2.2330322265625, -2.111083984375, -1.9891357421875, -1.8671875, -1.7452392578125, -1.623291015625, -1.5013427734375, -1.37939453125, -1.2574462890625, -1.135498046875, -1.0135498046875, -0.8916015625, -0.7696533203125, -0.647705078125, -0.5257568359375, -0.40380859375, -0.2818603515625, -0.159912109375, -0.0379638671875, 0.083984375, 0.2059326171875, 0.327880859375, 0.4498291015625, 0.57177734375, 0.6937255859375, 0.815673828125, 0.9376220703125, 1.0595703125, 1.1815185546875, 1.303466796875, 1.4254150390625, 1.54736328125, 1.6693115234375, 1.791259765625, 1.9132080078125, 2.03515625, 2.1571044921875, 2.279052734375, 2.4010009765625, 2.52294921875, 2.6448974609375, 2.766845703125, 2.8887939453125, 3.0107421875, 3.1326904296875, 3.254638671875, 3.3765869140625, 3.49853515625, 3.6204833984375, 3.742431640625, 3.8643798828125, 3.986328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 8.0, 9.0, 12.0, 10.0, 21.0, 31.0, 31.0, 20.0, 29.0, 41.0, 25.0, 41.0, 39.0, 36.0, 50.0, 46.0, 43.0, 60.0, 42.0, 47.0, 40.0, 34.0, 39.0, 33.0, 26.0, 29.0, 28.0, 23.0, 24.0, 16.0, 17.0, 9.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.18719482421875, -5.0345458984375, -4.88189697265625, -4.729248046875, -4.57659912109375, -4.4239501953125, -4.27130126953125, -4.11865234375, -3.96600341796875, -3.8133544921875, -3.66070556640625, -3.508056640625, -3.35540771484375, -3.2027587890625, -3.05010986328125, -2.8974609375, -2.74481201171875, -2.5921630859375, -2.43951416015625, -2.286865234375, -2.13421630859375, -1.9815673828125, -1.82891845703125, -1.67626953125, -1.52362060546875, -1.3709716796875, -1.21832275390625, -1.065673828125, -0.91302490234375, -0.7603759765625, -0.60772705078125, -0.455078125, -0.30242919921875, -0.1497802734375, 0.00286865234375, 0.155517578125, 0.30816650390625, 0.4608154296875, 0.61346435546875, 0.76611328125, 0.91876220703125, 1.0714111328125, 1.22406005859375, 1.376708984375, 1.52935791015625, 1.6820068359375, 1.83465576171875, 1.9873046875, 2.13995361328125, 2.2926025390625, 2.44525146484375, 2.597900390625, 2.75054931640625, 2.9031982421875, 3.05584716796875, 3.20849609375, 3.36114501953125, 3.5137939453125, 3.66644287109375, 3.819091796875, 3.97174072265625, 4.1243896484375, 4.27703857421875, 4.4296875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 6.0, 10.0, 12.0, 21.0, 22.0, 40.0, 58.0, 52.0, 84.0, 129.0, 196.0, 225.0, 358.0, 500.0, 781.0, 1093.0, 1783.0, 2861.0, 4786.0, 8484.0, 16032.0, 36416.0, 586136.0, 321965.0, 31288.0, 14973.0, 7873.0, 4492.0, 2743.0, 1767.0, 1104.0, 696.0, 466.0, 286.0, 225.0, 154.0, 122.0, 64.0, 61.0, 40.0, 43.0, 26.0, 19.0, 15.0, 12.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4248046875, -0.4106101989746094, -0.39641571044921875, -0.3822212219238281, -0.3680267333984375, -0.3538322448730469, -0.33963775634765625, -0.3254432678222656, -0.311248779296875, -0.2970542907714844, -0.28285980224609375, -0.2686653137207031, -0.2544708251953125, -0.24027633666992188, -0.22608184814453125, -0.21188735961914062, -0.19769287109375, -0.18349838256835938, -0.16930389404296875, -0.15510940551757812, -0.1409149169921875, -0.12672042846679688, -0.11252593994140625, -0.09833145141601562, -0.084136962890625, -0.06994247436523438, -0.05574798583984375, -0.041553497314453125, -0.0273590087890625, -0.013164520263671875, 0.00102996826171875, 0.015224456787109375, 0.0294189453125, 0.043613433837890625, 0.05780792236328125, 0.07200241088867188, 0.0861968994140625, 0.10039138793945312, 0.11458587646484375, 0.12878036499023438, 0.142974853515625, 0.15716934204101562, 0.17136383056640625, 0.18555831909179688, 0.1997528076171875, 0.21394729614257812, 0.22814178466796875, 0.24233627319335938, 0.25653076171875, 0.2707252502441406, 0.28491973876953125, 0.2991142272949219, 0.3133087158203125, 0.3275032043457031, 0.34169769287109375, 0.3558921813964844, 0.370086669921875, 0.3842811584472656, 0.39847564697265625, 0.4126701354980469, 0.4268646240234375, 0.4410591125488281, 0.45525360107421875, 0.4694480895996094, 0.483642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 6.0, 8.0, 9.0, 25.0, 13.0, 20.0, 33.0, 26.0, 20.0, 32.0, 51.0, 58.0, 63.0, 59.0, 72.0, 68.0, 54.0, 63.0, 54.0, 43.0, 38.0, 40.0, 21.0, 35.0, 15.0, 13.0, 11.0, 11.0, 2.0, 7.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4960765838623047e-05, -1.4440156519412994e-05, -1.3919547200202942e-05, -1.339893788099289e-05, -1.2878328561782837e-05, -1.2357719242572784e-05, -1.1837109923362732e-05, -1.131650060415268e-05, -1.0795891284942627e-05, -1.0275281965732574e-05, -9.754672646522522e-06, -9.23406332731247e-06, -8.713454008102417e-06, -8.192844688892365e-06, -7.672235369682312e-06, -7.1516260504722595e-06, -6.631016731262207e-06, -6.1104074120521545e-06, -5.589798092842102e-06, -5.0691887736320496e-06, -4.548579454421997e-06, -4.027970135211945e-06, -3.507360816001892e-06, -2.9867514967918396e-06, -2.466142177581787e-06, -1.9455328583717346e-06, -1.4249235391616821e-06, -9.043142199516296e-07, -3.8370490074157715e-07, 1.3690441846847534e-07, 6.575137376785278e-07, 1.1781230568885803e-06, 1.6987323760986328e-06, 2.2193416953086853e-06, 2.739951014518738e-06, 3.2605603337287903e-06, 3.7811696529388428e-06, 4.301778972148895e-06, 4.822388291358948e-06, 5.342997610569e-06, 5.863606929779053e-06, 6.384216248989105e-06, 6.904825568199158e-06, 7.42543488740921e-06, 7.946044206619263e-06, 8.466653525829315e-06, 8.987262845039368e-06, 9.50787216424942e-06, 1.0028481483459473e-05, 1.0549090802669525e-05, 1.1069700121879578e-05, 1.159030944108963e-05, 1.2110918760299683e-05, 1.2631528079509735e-05, 1.3152137398719788e-05, 1.367274671792984e-05, 1.4193356037139893e-05, 1.4713965356349945e-05, 1.5234574675559998e-05, 1.575518399477005e-05, 1.6275793313980103e-05, 1.6796402633190155e-05, 1.7317011952400208e-05, 1.783762127161026e-05, 1.8358230590820312e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 9.0, 16.0, 19.0, 25.0, 35.0, 62.0, 76.0, 116.0, 147.0, 231.0, 359.0, 534.0, 870.0, 1531.0, 2678.0, 4632.0, 8377.0, 15220.0, 28101.0, 52453.0, 96275.0, 172168.0, 242117.0, 186876.0, 107516.0, 58307.0, 31434.0, 16974.0, 8962.0, 5041.0, 2951.0, 1626.0, 1032.0, 601.0, 365.0, 266.0, 175.0, 123.0, 87.0, 60.0, 25.0, 21.0, 21.0, 12.0, 9.0, 6.0, 1.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.52978515625, -0.5135269165039062, -0.4972686767578125, -0.48101043701171875, -0.464752197265625, -0.44849395751953125, -0.4322357177734375, -0.41597747802734375, -0.39971923828125, -0.38346099853515625, -0.3672027587890625, -0.35094451904296875, -0.334686279296875, -0.31842803955078125, -0.3021697998046875, -0.28591156005859375, -0.2696533203125, -0.25339508056640625, -0.2371368408203125, -0.22087860107421875, -0.204620361328125, -0.18836212158203125, -0.1721038818359375, -0.15584564208984375, -0.13958740234375, -0.12332916259765625, -0.1070709228515625, -0.09081268310546875, -0.074554443359375, -0.05829620361328125, -0.0420379638671875, -0.02577972412109375, -0.009521484375, 0.00673675537109375, 0.0229949951171875, 0.03925323486328125, 0.055511474609375, 0.07176971435546875, 0.0880279541015625, 0.10428619384765625, 0.12054443359375, 0.13680267333984375, 0.1530609130859375, 0.16931915283203125, 0.185577392578125, 0.20183563232421875, 0.2180938720703125, 0.23435211181640625, 0.2506103515625, 0.26686859130859375, 0.2831268310546875, 0.29938507080078125, 0.315643310546875, 0.33190155029296875, 0.3481597900390625, 0.36441802978515625, 0.38067626953125, 0.39693450927734375, 0.4131927490234375, 0.42945098876953125, 0.445709228515625, 0.46196746826171875, 0.4782257080078125, 0.49448394775390625, 0.5107421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 16.0, 13.0, 14.0, 15.0, 29.0, 31.0, 50.0, 39.0, 51.0, 56.0, 83.0, 96.0, 79.0, 82.0, 70.0, 61.0, 44.0, 41.0, 27.0, 22.0, 19.0, 8.0, 13.0, 12.0, 7.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.32283782958984375, -0.3131561279296875, -0.30347442626953125, -0.293792724609375, -0.28411102294921875, -0.2744293212890625, -0.26474761962890625, -0.25506591796875, -0.24538421630859375, -0.2357025146484375, -0.22602081298828125, -0.216339111328125, -0.20665740966796875, -0.1969757080078125, -0.18729400634765625, -0.1776123046875, -0.16793060302734375, -0.1582489013671875, -0.14856719970703125, -0.138885498046875, -0.12920379638671875, -0.1195220947265625, -0.10984039306640625, -0.10015869140625, -0.09047698974609375, -0.0807952880859375, -0.07111358642578125, -0.061431884765625, -0.05175018310546875, -0.0420684814453125, -0.03238677978515625, -0.022705078125, -0.01302337646484375, -0.0033416748046875, 0.00634002685546875, 0.016021728515625, 0.02570343017578125, 0.0353851318359375, 0.04506683349609375, 0.05474853515625, 0.06443023681640625, 0.0741119384765625, 0.08379364013671875, 0.093475341796875, 0.10315704345703125, 0.1128387451171875, 0.12252044677734375, 0.1322021484375, 0.14188385009765625, 0.1515655517578125, 0.16124725341796875, 0.170928955078125, 0.18061065673828125, 0.1902923583984375, 0.19997406005859375, 0.20965576171875, 0.21933746337890625, 0.2290191650390625, 0.23870086669921875, 0.248382568359375, 0.25806427001953125, 0.2677459716796875, 0.27742767333984375, 0.287109375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 8.0, 7.0, 20.0, 15.0, 30.0, 19.0, 29.0, 18.0, 33.0, 32.0, 44.0, 56.0, 56.0, 43.0, 54.0, 52.0, 55.0, 65.0, 60.0, 40.0, 39.0, 34.0, 34.0, 29.0, 28.0, 25.0, 16.0, 8.0, 9.0, 12.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.325235366821289, -7.103611469268799, -6.881987571716309, -6.66036319732666, -6.43873929977417, -6.21711540222168, -5.9954915046691895, -5.773867607116699, -5.552243232727051, -5.3306193351745605, -5.10899543762207, -4.887371063232422, -4.665747165679932, -4.444123268127441, -4.222499370574951, -4.000875473022461, -3.7792515754699707, -3.5576276779174805, -3.336003541946411, -3.114379644393921, -2.8927555084228516, -2.6711316108703613, -2.449507713317871, -2.227883815765381, -2.0062596797943115, -1.7846356630325317, -1.563011646270752, -1.3413877487182617, -1.119763731956482, -0.8981397151947021, -0.6765158176422119, -0.45489180088043213, -0.23326826095581055, -0.01164427399635315, 0.20997971296310425, 0.43160367012023926, 0.653227686882019, 0.8748517036437988, 1.096475601196289, 1.3180996179580688, 1.5397236347198486, 1.7613476514816284, 1.9829716682434082, 2.2045955657958984, 2.4262194633483887, 2.647843599319458, 2.8694674968719482, 3.0910916328430176, 3.312715530395508, 3.534339427947998, 3.7559635639190674, 3.9775874614715576, 4.199211597442627, 4.420835494995117, 4.642459392547607, 4.864083290100098, 5.085707664489746, 5.307331562042236, 5.528955459594727, 5.750579833984375, 5.972203731536865, 6.1938276290893555, 6.415451526641846, 6.637075424194336, 6.858699321746826]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 7.0, 7.0, 12.0, 11.0, 12.0, 19.0, 28.0, 16.0, 25.0, 30.0, 32.0, 29.0, 37.0, 30.0, 37.0, 33.0, 36.0, 40.0, 44.0, 47.0, 34.0, 40.0, 31.0, 43.0, 41.0, 31.0, 35.0, 29.0, 17.0, 27.0, 27.0, 16.0, 11.0, 16.0, 7.0, 14.0, 5.0, 15.0, 5.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.429180145263672, -5.243146896362305, -5.0571136474609375, -4.87108039855957, -4.685047149658203, -4.499014377593994, -4.312981128692627, -4.12694787979126, -3.9409146308898926, -3.7548813819885254, -3.568848133087158, -3.38281512260437, -3.196781873703003, -3.0107486248016357, -2.8247156143188477, -2.6386823654174805, -2.4526491165161133, -2.266615867614746, -2.080582618713379, -1.8945496082305908, -1.7085163593292236, -1.5224831104278564, -1.3364499807357788, -1.1504168510437012, -0.964383602142334, -0.7783504128456116, -0.5923172235488892, -0.40628403425216675, -0.22025084495544434, -0.034217655658721924, 0.1518155336380005, 0.3378486633300781, 0.5238823890686035, 0.7099155783653259, 0.8959487676620483, 1.081981897354126, 1.2680151462554932, 1.4540483951568604, 1.640081524848938, 1.8261146545410156, 2.012147903442383, 2.19818115234375, 2.384214401245117, 2.5702474117279053, 2.7562806606292725, 2.9423139095306396, 3.1283469200134277, 3.314380168914795, 3.500413417816162, 3.6864466667175293, 3.8724799156188965, 4.058513164520264, 4.244545936584473, 4.43057918548584, 4.616612434387207, 4.802645683288574, 4.988678932189941, 5.174712181091309, 5.360745429992676, 5.546778678894043, 5.73281192779541, 5.918844699859619, 6.104877948760986, 6.2909111976623535, 6.476944446563721]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 18.0, 23.0, 31.0, 62.0, 96.0, 124.0, 200.0, 265.0, 458.0, 649.0, 1014.0, 1459.0, 2272.0, 3316.0, 5150.0, 7816.0, 11766.0, 18110.0, 27972.0, 42099.0, 62160.0, 87607.0, 113337.0, 131058.0, 131935.0, 116296.0, 89745.0, 64642.0, 44340.0, 29201.0, 19083.0, 12428.0, 8052.0, 5315.0, 3508.0, 2304.0, 1500.0, 1038.0, 703.0, 462.0, 338.0, 199.0, 130.0, 98.0, 55.0, 40.0, 24.0, 26.0, 11.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.6015625, -4.46234130859375, -4.3231201171875, -4.18389892578125, -4.044677734375, -3.90545654296875, -3.7662353515625, -3.62701416015625, -3.48779296875, -3.34857177734375, -3.2093505859375, -3.07012939453125, -2.930908203125, -2.79168701171875, -2.6524658203125, -2.51324462890625, -2.3740234375, -2.23480224609375, -2.0955810546875, -1.95635986328125, -1.817138671875, -1.67791748046875, -1.5386962890625, -1.39947509765625, -1.26025390625, -1.12103271484375, -0.9818115234375, -0.84259033203125, -0.703369140625, -0.56414794921875, -0.4249267578125, -0.28570556640625, -0.146484375, -0.00726318359375, 0.1319580078125, 0.27117919921875, 0.410400390625, 0.54962158203125, 0.6888427734375, 0.82806396484375, 0.96728515625, 1.10650634765625, 1.2457275390625, 1.38494873046875, 1.524169921875, 1.66339111328125, 1.8026123046875, 1.94183349609375, 2.0810546875, 2.22027587890625, 2.3594970703125, 2.49871826171875, 2.637939453125, 2.77716064453125, 2.9163818359375, 3.05560302734375, 3.19482421875, 3.33404541015625, 3.4732666015625, 3.61248779296875, 3.751708984375, 3.89093017578125, 4.0301513671875, 4.16937255859375, 4.30859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 7.0, 12.0, 19.0, 14.0, 17.0, 12.0, 19.0, 23.0, 33.0, 30.0, 33.0, 32.0, 31.0, 31.0, 29.0, 34.0, 41.0, 44.0, 40.0, 32.0, 39.0, 44.0, 39.0, 38.0, 27.0, 34.0, 29.0, 29.0, 23.0, 23.0, 13.0, 18.0, 13.0, 13.0, 13.0, 11.0, 6.0, 9.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3046875, -5.125732421875, -4.94677734375, -4.767822265625, -4.5888671875, -4.409912109375, -4.23095703125, -4.052001953125, -3.873046875, -3.694091796875, -3.51513671875, -3.336181640625, -3.1572265625, -2.978271484375, -2.79931640625, -2.620361328125, -2.44140625, -2.262451171875, -2.08349609375, -1.904541015625, -1.7255859375, -1.546630859375, -1.36767578125, -1.188720703125, -1.009765625, -0.830810546875, -0.65185546875, -0.472900390625, -0.2939453125, -0.114990234375, 0.06396484375, 0.242919921875, 0.421875, 0.600830078125, 0.77978515625, 0.958740234375, 1.1376953125, 1.316650390625, 1.49560546875, 1.674560546875, 1.853515625, 2.032470703125, 2.21142578125, 2.390380859375, 2.5693359375, 2.748291015625, 2.92724609375, 3.106201171875, 3.28515625, 3.464111328125, 3.64306640625, 3.822021484375, 4.0009765625, 4.179931640625, 4.35888671875, 4.537841796875, 4.716796875, 4.895751953125, 5.07470703125, 5.253662109375, 5.4326171875, 5.611572265625, 5.79052734375, 5.969482421875, 6.1484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 13.0, 24.0, 28.0, 45.0, 74.0, 100.0, 169.0, 252.0, 409.0, 667.0, 964.0, 1547.0, 2338.0, 3413.0, 5408.0, 8446.0, 13046.0, 19797.0, 30422.0, 46008.0, 65693.0, 90549.0, 114836.0, 129347.0, 128394.0, 111531.0, 86602.0, 63263.0, 42846.0, 28578.0, 18655.0, 12460.0, 8020.0, 5045.0, 3282.0, 2215.0, 1437.0, 948.0, 612.0, 338.0, 287.0, 148.0, 97.0, 77.0, 46.0, 22.0, 14.0, 12.0, 12.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-4.84375, -4.6966552734375, -4.549560546875, -4.4024658203125, -4.25537109375, -4.1082763671875, -3.961181640625, -3.8140869140625, -3.6669921875, -3.5198974609375, -3.372802734375, -3.2257080078125, -3.07861328125, -2.9315185546875, -2.784423828125, -2.6373291015625, -2.490234375, -2.3431396484375, -2.196044921875, -2.0489501953125, -1.90185546875, -1.7547607421875, -1.607666015625, -1.4605712890625, -1.3134765625, -1.1663818359375, -1.019287109375, -0.8721923828125, -0.72509765625, -0.5780029296875, -0.430908203125, -0.2838134765625, -0.13671875, 0.0103759765625, 0.157470703125, 0.3045654296875, 0.45166015625, 0.5987548828125, 0.745849609375, 0.8929443359375, 1.0400390625, 1.1871337890625, 1.334228515625, 1.4813232421875, 1.62841796875, 1.7755126953125, 1.922607421875, 2.0697021484375, 2.216796875, 2.3638916015625, 2.510986328125, 2.6580810546875, 2.80517578125, 2.9522705078125, 3.099365234375, 3.2464599609375, 3.3935546875, 3.5406494140625, 3.687744140625, 3.8348388671875, 3.98193359375, 4.1290283203125, 4.276123046875, 4.4232177734375, 4.5703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 1.0, 8.0, 7.0, 13.0, 8.0, 14.0, 14.0, 15.0, 17.0, 22.0, 15.0, 21.0, 25.0, 31.0, 31.0, 34.0, 50.0, 35.0, 40.0, 41.0, 32.0, 42.0, 34.0, 32.0, 35.0, 40.0, 41.0, 33.0, 28.0, 28.0, 23.0, 25.0, 18.0, 18.0, 15.0, 15.0, 15.0, 12.0, 12.0, 12.0, 11.0, 10.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 4.0, 1.0], "bins": [-3.6953125, -3.58734130859375, -3.4793701171875, -3.37139892578125, -3.263427734375, -3.15545654296875, -3.0474853515625, -2.93951416015625, -2.83154296875, -2.72357177734375, -2.6156005859375, -2.50762939453125, -2.399658203125, -2.29168701171875, -2.1837158203125, -2.07574462890625, -1.9677734375, -1.85980224609375, -1.7518310546875, -1.64385986328125, -1.535888671875, -1.42791748046875, -1.3199462890625, -1.21197509765625, -1.10400390625, -0.99603271484375, -0.8880615234375, -0.78009033203125, -0.672119140625, -0.56414794921875, -0.4561767578125, -0.34820556640625, -0.240234375, -0.13226318359375, -0.0242919921875, 0.08367919921875, 0.191650390625, 0.29962158203125, 0.4075927734375, 0.51556396484375, 0.62353515625, 0.73150634765625, 0.8394775390625, 0.94744873046875, 1.055419921875, 1.16339111328125, 1.2713623046875, 1.37933349609375, 1.4873046875, 1.59527587890625, 1.7032470703125, 1.81121826171875, 1.919189453125, 2.02716064453125, 2.1351318359375, 2.24310302734375, 2.35107421875, 2.45904541015625, 2.5670166015625, 2.67498779296875, 2.782958984375, 2.89093017578125, 2.9989013671875, 3.10687255859375, 3.21484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 18.0, 11.0, 22.0, 18.0, 43.0, 42.0, 63.0, 92.0, 139.0, 146.0, 258.0, 394.0, 546.0, 852.0, 1294.0, 2000.0, 3291.0, 5365.0, 8822.0, 15029.0, 25836.0, 44093.0, 72390.0, 109074.0, 142702.0, 159217.0, 147682.0, 114098.0, 77459.0, 47521.0, 28351.0, 16410.0, 9606.0, 5809.0, 3480.0, 2217.0, 1406.0, 864.0, 569.0, 381.0, 293.0, 212.0, 120.0, 104.0, 58.0, 47.0, 32.0, 26.0, 18.0, 14.0, 3.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.888671875, -1.828857421875, -1.76904296875, -1.709228515625, -1.6494140625, -1.589599609375, -1.52978515625, -1.469970703125, -1.41015625, -1.350341796875, -1.29052734375, -1.230712890625, -1.1708984375, -1.111083984375, -1.05126953125, -0.991455078125, -0.931640625, -0.871826171875, -0.81201171875, -0.752197265625, -0.6923828125, -0.632568359375, -0.57275390625, -0.512939453125, -0.453125, -0.393310546875, -0.33349609375, -0.273681640625, -0.2138671875, -0.154052734375, -0.09423828125, -0.034423828125, 0.025390625, 0.085205078125, 0.14501953125, 0.204833984375, 0.2646484375, 0.324462890625, 0.38427734375, 0.444091796875, 0.50390625, 0.563720703125, 0.62353515625, 0.683349609375, 0.7431640625, 0.802978515625, 0.86279296875, 0.922607421875, 0.982421875, 1.042236328125, 1.10205078125, 1.161865234375, 1.2216796875, 1.281494140625, 1.34130859375, 1.401123046875, 1.4609375, 1.520751953125, 1.58056640625, 1.640380859375, 1.7001953125, 1.760009765625, 1.81982421875, 1.879638671875, 1.939453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 13.0, 8.0, 12.0, 15.0, 20.0, 21.0, 22.0, 25.0, 32.0, 54.0, 64.0, 42.0, 48.0, 52.0, 46.0, 62.0, 54.0, 54.0, 59.0, 40.0, 51.0, 30.0, 31.0, 22.0, 18.0, 22.0, 17.0, 9.0, 12.0, 11.0, 7.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001703500747680664, -0.0001637544482946396, -0.00015715882182121277, -0.00015056319534778595, -0.00014396756887435913, -0.0001373719424009323, -0.0001307763159275055, -0.00012418068945407867, -0.00011758506298065186, -0.00011098943650722504, -0.00010439381003379822, -9.77981835603714e-05, -9.120255708694458e-05, -8.460693061351776e-05, -7.801130414009094e-05, -7.141567766666412e-05, -6.48200511932373e-05, -5.8224424719810486e-05, -5.162879824638367e-05, -4.503317177295685e-05, -3.843754529953003e-05, -3.184191882610321e-05, -2.524629235267639e-05, -1.8650665879249573e-05, -1.2055039405822754e-05, -5.459412932395935e-06, 1.1362135410308838e-06, 7.731840014457703e-06, 1.4327466487884521e-05, 2.092309296131134e-05, 2.751871943473816e-05, 3.411434590816498e-05, 4.07099723815918e-05, 4.7305598855018616e-05, 5.3901225328445435e-05, 6.0496851801872253e-05, 6.709247827529907e-05, 7.368810474872589e-05, 8.028373122215271e-05, 8.687935769557953e-05, 9.347498416900635e-05, 0.00010007061064243317, 0.00010666623711585999, 0.0001132618635892868, 0.00011985749006271362, 0.00012645311653614044, 0.00013304874300956726, 0.00013964436948299408, 0.0001462399959564209, 0.00015283562242984772, 0.00015943124890327454, 0.00016602687537670135, 0.00017262250185012817, 0.000179218128323555, 0.0001858137547969818, 0.00019240938127040863, 0.00019900500774383545, 0.00020560063421726227, 0.0002121962606906891, 0.0002187918871641159, 0.00022538751363754272, 0.00023198314011096954, 0.00023857876658439636, 0.0002451743930578232, 0.00025177001953125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 6.0, 3.0, 3.0, 8.0, 10.0, 25.0, 30.0, 42.0, 64.0, 65.0, 106.0, 174.0, 233.0, 342.0, 480.0, 799.0, 1101.0, 1553.0, 2386.0, 3728.0, 5929.0, 9556.0, 15300.0, 24575.0, 39483.0, 60585.0, 88353.0, 117851.0, 138683.0, 139500.0, 121984.0, 94586.0, 65750.0, 42573.0, 26910.0, 16875.0, 10276.0, 6414.0, 4059.0, 2677.0, 1746.0, 1171.0, 775.0, 535.0, 392.0, 250.0, 173.0, 122.0, 83.0, 73.0, 47.0, 33.0, 23.0, 23.0, 16.0, 7.0, 7.0, 6.0, 5.0, 4.0, 3.0], "bins": [-1.8134765625, -1.7569732666015625, -1.700469970703125, -1.6439666748046875, -1.58746337890625, -1.5309600830078125, -1.474456787109375, -1.4179534912109375, -1.3614501953125, -1.3049468994140625, -1.248443603515625, -1.1919403076171875, -1.13543701171875, -1.0789337158203125, -1.022430419921875, -0.9659271240234375, -0.909423828125, -0.8529205322265625, -0.796417236328125, -0.7399139404296875, -0.68341064453125, -0.6269073486328125, -0.570404052734375, -0.5139007568359375, -0.4573974609375, -0.4008941650390625, -0.344390869140625, -0.2878875732421875, -0.23138427734375, -0.1748809814453125, -0.118377685546875, -0.0618743896484375, -0.00537109375, 0.0511322021484375, 0.107635498046875, 0.1641387939453125, 0.22064208984375, 0.2771453857421875, 0.333648681640625, 0.3901519775390625, 0.4466552734375, 0.5031585693359375, 0.559661865234375, 0.6161651611328125, 0.67266845703125, 0.7291717529296875, 0.785675048828125, 0.8421783447265625, 0.898681640625, 0.9551849365234375, 1.011688232421875, 1.0681915283203125, 1.12469482421875, 1.1811981201171875, 1.237701416015625, 1.2942047119140625, 1.3507080078125, 1.4072113037109375, 1.463714599609375, 1.5202178955078125, 1.57672119140625, 1.6332244873046875, 1.689727783203125, 1.7462310791015625, 1.802734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 2.0, 13.0, 11.0, 9.0, 11.0, 20.0, 21.0, 24.0, 32.0, 29.0, 34.0, 62.0, 62.0, 54.0, 68.0, 55.0, 78.0, 65.0, 66.0, 49.0, 44.0, 32.0, 34.0, 25.0, 23.0, 13.0, 13.0, 14.0, 7.0, 5.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0771484375, -1.0475311279296875, -1.017913818359375, -0.9882965087890625, -0.95867919921875, -0.9290618896484375, -0.899444580078125, -0.8698272705078125, -0.8402099609375, -0.8105926513671875, -0.780975341796875, -0.7513580322265625, -0.72174072265625, -0.6921234130859375, -0.662506103515625, -0.6328887939453125, -0.603271484375, -0.5736541748046875, -0.544036865234375, -0.5144195556640625, -0.48480224609375, -0.4551849365234375, -0.425567626953125, -0.3959503173828125, -0.3663330078125, -0.3367156982421875, -0.307098388671875, -0.2774810791015625, -0.24786376953125, -0.2182464599609375, -0.188629150390625, -0.1590118408203125, -0.12939453125, -0.0997772216796875, -0.070159912109375, -0.0405426025390625, -0.01092529296875, 0.0186920166015625, 0.048309326171875, 0.0779266357421875, 0.1075439453125, 0.1371612548828125, 0.166778564453125, 0.1963958740234375, 0.22601318359375, 0.2556304931640625, 0.285247802734375, 0.3148651123046875, 0.344482421875, 0.3740997314453125, 0.403717041015625, 0.4333343505859375, 0.46295166015625, 0.4925689697265625, 0.522186279296875, 0.5518035888671875, 0.5814208984375, 0.6110382080078125, 0.640655517578125, 0.6702728271484375, 0.69989013671875, 0.7295074462890625, 0.759124755859375, 0.7887420654296875, 0.818359375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 7.0, 10.0, 11.0, 10.0, 10.0, 21.0, 22.0, 17.0, 20.0, 25.0, 27.0, 43.0, 51.0, 48.0, 50.0, 52.0, 63.0, 39.0, 55.0, 51.0, 57.0, 40.0, 47.0, 34.0, 25.0, 29.0, 34.0, 21.0, 16.0, 14.0, 17.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.950682163238525, -6.733675956726074, -6.516669750213623, -6.299663543701172, -6.082657337188721, -5.8656511306762695, -5.648644924163818, -5.431638717651367, -5.214632511138916, -4.997626304626465, -4.780620098114014, -4.5636138916015625, -4.346607685089111, -4.12960147857666, -3.912595272064209, -3.695589065551758, -3.4785828590393066, -3.2615766525268555, -3.0445704460144043, -2.827564239501953, -2.610558032989502, -2.393551826477051, -2.1765456199645996, -1.9595394134521484, -1.7425332069396973, -1.525527000427246, -1.308520793914795, -1.0915145874023438, -0.8745083808898926, -0.6575021743774414, -0.44049596786499023, -0.22348976135253906, -0.006484031677246094, 0.21052217483520508, 0.42752838134765625, 0.6445345878601074, 0.8615407943725586, 1.0785470008850098, 1.295553207397461, 1.512559413909912, 1.7295656204223633, 1.9465718269348145, 2.1635780334472656, 2.380584239959717, 2.597590446472168, 2.814596652984619, 3.0316028594970703, 3.2486090660095215, 3.4656152725219727, 3.682621479034424, 3.899627685546875, 4.116633892059326, 4.333640098571777, 4.5506463050842285, 4.76765251159668, 4.984658718109131, 5.201664924621582, 5.418671131134033, 5.635677337646484, 5.8526835441589355, 6.069689750671387, 6.286695957183838, 6.503702163696289, 6.72070837020874, 6.937714576721191]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 1.0, 14.0, 5.0, 8.0, 10.0, 21.0, 15.0, 28.0, 26.0, 32.0, 37.0, 27.0, 34.0, 28.0, 43.0, 37.0, 31.0, 39.0, 37.0, 31.0, 36.0, 41.0, 42.0, 39.0, 48.0, 27.0, 28.0, 32.0, 28.0, 26.0, 19.0, 15.0, 19.0, 14.0, 10.0, 12.0, 12.0, 12.0, 9.0, 3.0, 8.0, 6.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.607245445251465, -5.403995513916016, -5.200745582580566, -4.997495651245117, -4.79424524307251, -4.5909953117370605, -4.387745380401611, -4.184495449066162, -3.981245279312134, -3.7779953479766846, -3.5747451782226562, -3.371495246887207, -3.168245315551758, -2.9649951457977295, -2.7617452144622803, -2.558495044708252, -2.3552451133728027, -2.1519951820373535, -1.9487450122833252, -1.745495080947876, -1.5422450304031372, -1.3389949798583984, -1.1357450485229492, -0.9324949979782104, -0.7292449474334717, -0.5259948968887329, -0.3227449059486389, -0.11949491500854492, 0.08375513553619385, 0.2870051860809326, 0.49025511741638184, 0.6935051679611206, 0.8967547416687012, 1.10000479221344, 1.3032548427581787, 1.506504774093628, 1.7097548246383667, 1.9130048751831055, 2.1162548065185547, 2.319504737854004, 2.5227549076080322, 2.7260048389434814, 2.9292550086975098, 3.132504940032959, 3.335754871368408, 3.5390050411224365, 3.7422549724578857, 3.945505142211914, 4.148755073547363, 4.3520050048828125, 4.555254936218262, 4.758504867553711, 4.961755275726318, 5.165005207061768, 5.368255138397217, 5.571505069732666, 5.774755477905273, 5.978005409240723, 6.181255340576172, 6.384505271911621, 6.5877556800842285, 6.791005611419678, 6.994255542755127, 7.197505474090576, 7.400755405426025]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 14.0, 21.0, 28.0, 52.0, 64.0, 93.0, 121.0, 188.0, 296.0, 488.0, 760.0, 1236.0, 1829.0, 3148.0, 5506.0, 9411.0, 16824.0, 30870.0, 58254.0, 111638.0, 214230.0, 388771.0, 619614.0, 786190.0, 743467.0, 532023.0, 314166.0, 167224.0, 86659.0, 45431.0, 24406.0, 13344.0, 7355.0, 4219.0, 2517.0, 1401.0, 878.0, 520.0, 346.0, 256.0, 132.0, 98.0, 64.0, 44.0, 24.0, 24.0, 9.0, 9.0, 10.0, 2.0, 0.0, 3.0], "bins": [-6.90625, -6.71337890625, -6.5205078125, -6.32763671875, -6.134765625, -5.94189453125, -5.7490234375, -5.55615234375, -5.36328125, -5.17041015625, -4.9775390625, -4.78466796875, -4.591796875, -4.39892578125, -4.2060546875, -4.01318359375, -3.8203125, -3.62744140625, -3.4345703125, -3.24169921875, -3.048828125, -2.85595703125, -2.6630859375, -2.47021484375, -2.27734375, -2.08447265625, -1.8916015625, -1.69873046875, -1.505859375, -1.31298828125, -1.1201171875, -0.92724609375, -0.734375, -0.54150390625, -0.3486328125, -0.15576171875, 0.037109375, 0.22998046875, 0.4228515625, 0.61572265625, 0.80859375, 1.00146484375, 1.1943359375, 1.38720703125, 1.580078125, 1.77294921875, 1.9658203125, 2.15869140625, 2.3515625, 2.54443359375, 2.7373046875, 2.93017578125, 3.123046875, 3.31591796875, 3.5087890625, 3.70166015625, 3.89453125, 4.08740234375, 4.2802734375, 4.47314453125, 4.666015625, 4.85888671875, 5.0517578125, 5.24462890625, 5.4375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 4.0, 8.0, 10.0, 16.0, 21.0, 10.0, 27.0, 27.0, 21.0, 24.0, 23.0, 34.0, 36.0, 40.0, 29.0, 35.0, 35.0, 50.0, 27.0, 35.0, 31.0, 35.0, 47.0, 39.0, 37.0, 28.0, 31.0, 27.0, 24.0, 27.0, 20.0, 30.0, 13.0, 8.0, 7.0, 12.0, 13.0, 10.0, 8.0, 9.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.4453125, -5.27117919921875, -5.0970458984375, -4.92291259765625, -4.748779296875, -4.57464599609375, -4.4005126953125, -4.22637939453125, -4.05224609375, -3.87811279296875, -3.7039794921875, -3.52984619140625, -3.355712890625, -3.18157958984375, -3.0074462890625, -2.83331298828125, -2.6591796875, -2.48504638671875, -2.3109130859375, -2.13677978515625, -1.962646484375, -1.78851318359375, -1.6143798828125, -1.44024658203125, -1.26611328125, -1.09197998046875, -0.9178466796875, -0.74371337890625, -0.569580078125, -0.39544677734375, -0.2213134765625, -0.04718017578125, 0.126953125, 0.30108642578125, 0.4752197265625, 0.64935302734375, 0.823486328125, 0.99761962890625, 1.1717529296875, 1.34588623046875, 1.52001953125, 1.69415283203125, 1.8682861328125, 2.04241943359375, 2.216552734375, 2.39068603515625, 2.5648193359375, 2.73895263671875, 2.9130859375, 3.08721923828125, 3.2613525390625, 3.43548583984375, 3.609619140625, 3.78375244140625, 3.9578857421875, 4.13201904296875, 4.30615234375, 4.48028564453125, 4.6544189453125, 4.82855224609375, 5.002685546875, 5.17681884765625, 5.3509521484375, 5.52508544921875, 5.69921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 3.0, 6.0, 10.0, 17.0, 18.0, 33.0, 41.0, 62.0, 95.0, 131.0, 237.0, 315.0, 469.0, 817.0, 1306.0, 1991.0, 3487.0, 5804.0, 10005.0, 17553.0, 29898.0, 52735.0, 92772.0, 157548.0, 258381.0, 400755.0, 553709.0, 651292.0, 621259.0, 490498.0, 335773.0, 209862.0, 125312.0, 72733.0, 41613.0, 23775.0, 13715.0, 7978.0, 4776.0, 2796.0, 1732.0, 1013.0, 724.0, 403.0, 276.0, 197.0, 126.0, 76.0, 60.0, 31.0, 24.0, 20.0, 14.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.0390625, -5.8428955078125, -5.646728515625, -5.4505615234375, -5.25439453125, -5.0582275390625, -4.862060546875, -4.6658935546875, -4.4697265625, -4.2735595703125, -4.077392578125, -3.8812255859375, -3.68505859375, -3.4888916015625, -3.292724609375, -3.0965576171875, -2.900390625, -2.7042236328125, -2.508056640625, -2.3118896484375, -2.11572265625, -1.9195556640625, -1.723388671875, -1.5272216796875, -1.3310546875, -1.1348876953125, -0.938720703125, -0.7425537109375, -0.54638671875, -0.3502197265625, -0.154052734375, 0.0421142578125, 0.23828125, 0.4344482421875, 0.630615234375, 0.8267822265625, 1.02294921875, 1.2191162109375, 1.415283203125, 1.6114501953125, 1.8076171875, 2.0037841796875, 2.199951171875, 2.3961181640625, 2.59228515625, 2.7884521484375, 2.984619140625, 3.1807861328125, 3.376953125, 3.5731201171875, 3.769287109375, 3.9654541015625, 4.16162109375, 4.3577880859375, 4.553955078125, 4.7501220703125, 4.9462890625, 5.1424560546875, 5.338623046875, 5.5347900390625, 5.73095703125, 5.9271240234375, 6.123291015625, 6.3194580078125, 6.515625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 10.0, 7.0, 6.0, 11.0, 21.0, 12.0, 28.0, 35.0, 31.0, 36.0, 52.0, 70.0, 82.0, 100.0, 89.0, 104.0, 121.0, 174.0, 157.0, 191.0, 189.0, 195.0, 212.0, 219.0, 229.0, 204.0, 191.0, 176.0, 182.0, 157.0, 126.0, 124.0, 99.0, 75.0, 65.0, 60.0, 50.0, 44.0, 29.0, 25.0, 18.0, 12.0, 10.0, 18.0, 7.0, 4.0, 6.0, 5.0, 2.0, 3.0, 4.0], "bins": [-2.78125, -2.704833984375, -2.62841796875, -2.552001953125, -2.4755859375, -2.399169921875, -2.32275390625, -2.246337890625, -2.169921875, -2.093505859375, -2.01708984375, -1.940673828125, -1.8642578125, -1.787841796875, -1.71142578125, -1.635009765625, -1.55859375, -1.482177734375, -1.40576171875, -1.329345703125, -1.2529296875, -1.176513671875, -1.10009765625, -1.023681640625, -0.947265625, -0.870849609375, -0.79443359375, -0.718017578125, -0.6416015625, -0.565185546875, -0.48876953125, -0.412353515625, -0.3359375, -0.259521484375, -0.18310546875, -0.106689453125, -0.0302734375, 0.046142578125, 0.12255859375, 0.198974609375, 0.275390625, 0.351806640625, 0.42822265625, 0.504638671875, 0.5810546875, 0.657470703125, 0.73388671875, 0.810302734375, 0.88671875, 0.963134765625, 1.03955078125, 1.115966796875, 1.1923828125, 1.268798828125, 1.34521484375, 1.421630859375, 1.498046875, 1.574462890625, 1.65087890625, 1.727294921875, 1.8037109375, 1.880126953125, 1.95654296875, 2.032958984375, 2.109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 10.0, 8.0, 11.0, 16.0, 22.0, 19.0, 29.0, 32.0, 35.0, 31.0, 38.0, 42.0, 43.0, 57.0, 61.0, 46.0, 55.0, 59.0, 49.0, 42.0, 42.0, 41.0, 41.0, 31.0, 30.0, 21.0, 13.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6737213134765625, -7.430568695068359, -7.187416076660156, -6.944263458251953, -6.70111083984375, -6.457958221435547, -6.214806079864502, -5.971653461456299, -5.728500843048096, -5.485348224639893, -5.2421956062316895, -4.999042987823486, -4.755890846252441, -4.512738227844238, -4.269585609436035, -4.026432991027832, -3.783280372619629, -3.540127754211426, -3.2969751358032227, -3.0538227558135986, -2.8106701374053955, -2.5675175189971924, -2.3243651390075684, -2.0812125205993652, -1.838059902191162, -1.594907283782959, -1.3517547845840454, -1.1086022853851318, -0.8654496669769287, -0.6222970485687256, -0.379144549369812, -0.13599205017089844, 0.10716056823730469, 0.35031312704086304, 0.5934656858444214, 0.8366182446479797, 1.079770803451538, 1.3229234218597412, 1.5660759210586548, 1.8092284202575684, 2.0523810386657715, 2.2955336570739746, 2.5386862754821777, 2.7818386554718018, 3.024991273880005, 3.268143892288208, 3.511296272277832, 3.754448890686035, 3.9976015090942383, 4.240754127502441, 4.4839067459106445, 4.727059364318848, 4.970211982727051, 5.213364601135254, 5.456516742706299, 5.699669361114502, 5.942821979522705, 6.185974597930908, 6.429127216339111, 6.6722798347473145, 6.915431976318359, 7.1585845947265625, 7.401737213134766, 7.644889831542969, 7.888042449951172]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 10.0, 16.0, 14.0, 8.0, 12.0, 15.0, 13.0, 20.0, 22.0, 34.0, 22.0, 23.0, 22.0, 34.0, 25.0, 34.0, 33.0, 22.0, 43.0, 42.0, 27.0, 33.0, 31.0, 43.0, 39.0, 32.0, 31.0, 22.0, 34.0, 25.0, 23.0, 21.0, 33.0, 17.0, 15.0, 18.0, 17.0, 13.0, 6.0, 7.0, 7.0, 4.0, 10.0, 10.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.529283046722412, -5.338901996612549, -5.148521423339844, -4.9581403732299805, -4.767759323120117, -4.577378749847412, -4.386997699737549, -4.196617126464844, -4.0062360763549805, -3.8158552646636963, -3.625474214553833, -3.435093402862549, -3.2447125911712646, -3.0543317794799805, -2.863950729370117, -2.673569917678833, -2.4831888675689697, -2.2928080558776855, -2.1024270057678223, -1.912046194076538, -1.721665382385254, -1.5312844514846802, -1.3409035205841064, -1.1505227088928223, -0.9601417779922485, -0.7697609066963196, -0.5793800354003906, -0.3889991044998169, -0.19861823320388794, -0.008237361907958984, 0.18214356899261475, 0.3725243806838989, 0.5629053115844727, 0.7532861828804016, 0.9436670541763306, 1.1340479850769043, 1.3244287967681885, 1.5148097276687622, 1.705190658569336, 1.8955714702606201, 2.0859522819519043, 2.2763330936431885, 2.4667141437530518, 2.657094955444336, 2.84747576713562, 3.0378565788269043, 3.2282376289367676, 3.4186184406280518, 3.608999490737915, 3.799380302429199, 3.9897613525390625, 4.180142402648926, 4.370522975921631, 4.560904026031494, 4.751284599304199, 4.9416656494140625, 5.132046699523926, 5.322427749633789, 5.512808322906494, 5.703189373016357, 5.893570423126221, 6.083950996398926, 6.274332046508789, 6.464713096618652, 6.655093669891357]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 15.0, 26.0, 28.0, 42.0, 60.0, 78.0, 120.0, 185.0, 238.0, 340.0, 494.0, 666.0, 968.0, 1465.0, 2049.0, 3112.0, 4841.0, 7235.0, 11156.0, 17417.0, 27125.0, 43221.0, 68228.0, 105240.0, 148325.0, 169722.0, 146332.0, 103753.0, 66815.0, 42593.0, 27005.0, 16769.0, 10955.0, 6961.0, 4738.0, 3185.0, 2115.0, 1411.0, 1035.0, 740.0, 512.0, 393.0, 274.0, 166.0, 115.0, 79.0, 74.0, 37.0, 33.0, 24.0, 13.0, 6.0, 6.0, 8.0, 2.0, 1.0, 2.0], "bins": [-0.9697265625, -0.9398727416992188, -0.9100189208984375, -0.8801651000976562, -0.850311279296875, -0.8204574584960938, -0.7906036376953125, -0.7607498168945312, -0.73089599609375, -0.7010421752929688, -0.6711883544921875, -0.6413345336914062, -0.611480712890625, -0.5816268920898438, -0.5517730712890625, -0.5219192504882812, -0.4920654296875, -0.46221160888671875, -0.4323577880859375, -0.40250396728515625, -0.372650146484375, -0.34279632568359375, -0.3129425048828125, -0.28308868408203125, -0.25323486328125, -0.22338104248046875, -0.1935272216796875, -0.16367340087890625, -0.133819580078125, -0.10396575927734375, -0.0741119384765625, -0.04425811767578125, -0.014404296875, 0.01544952392578125, 0.0453033447265625, 0.07515716552734375, 0.105010986328125, 0.13486480712890625, 0.1647186279296875, 0.19457244873046875, 0.22442626953125, 0.25428009033203125, 0.2841339111328125, 0.31398773193359375, 0.343841552734375, 0.37369537353515625, 0.4035491943359375, 0.43340301513671875, 0.4632568359375, 0.49311065673828125, 0.5229644775390625, 0.5528182983398438, 0.582672119140625, 0.6125259399414062, 0.6423797607421875, 0.6722335815429688, 0.70208740234375, 0.7319412231445312, 0.7617950439453125, 0.7916488647460938, 0.821502685546875, 0.8513565063476562, 0.8812103271484375, 0.9110641479492188, 0.94091796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 5.0, 6.0, 12.0, 9.0, 8.0, 10.0, 15.0, 14.0, 18.0, 27.0, 26.0, 25.0, 31.0, 22.0, 39.0, 28.0, 23.0, 34.0, 32.0, 36.0, 49.0, 32.0, 42.0, 41.0, 27.0, 28.0, 31.0, 31.0, 29.0, 31.0, 28.0, 31.0, 29.0, 20.0, 18.0, 18.0, 16.0, 16.0, 13.0, 9.0, 7.0, 9.0, 3.0, 7.0, 3.0, 8.0, 3.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.165771484375, -5.96044921875, -5.755126953125, -5.5498046875, -5.344482421875, -5.13916015625, -4.933837890625, -4.728515625, -4.523193359375, -4.31787109375, -4.112548828125, -3.9072265625, -3.701904296875, -3.49658203125, -3.291259765625, -3.0859375, -2.880615234375, -2.67529296875, -2.469970703125, -2.2646484375, -2.059326171875, -1.85400390625, -1.648681640625, -1.443359375, -1.238037109375, -1.03271484375, -0.827392578125, -0.6220703125, -0.416748046875, -0.21142578125, -0.006103515625, 0.19921875, 0.404541015625, 0.60986328125, 0.815185546875, 1.0205078125, 1.225830078125, 1.43115234375, 1.636474609375, 1.841796875, 2.047119140625, 2.25244140625, 2.457763671875, 2.6630859375, 2.868408203125, 3.07373046875, 3.279052734375, 3.484375, 3.689697265625, 3.89501953125, 4.100341796875, 4.3056640625, 4.510986328125, 4.71630859375, 4.921630859375, 5.126953125, 5.332275390625, 5.53759765625, 5.742919921875, 5.9482421875, 6.153564453125, 6.35888671875, 6.564208984375, 6.76953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 13.0, 15.0, 19.0, 23.0, 29.0, 39.0, 48.0, 71.0, 94.0, 153.0, 189.0, 345.0, 481.0, 726.0, 1178.0, 1762.0, 2827.0, 4777.0, 7917.0, 14470.0, 30265.0, 160088.0, 702116.0, 69818.0, 22225.0, 11675.0, 6622.0, 3874.0, 2390.0, 1474.0, 939.0, 586.0, 400.0, 245.0, 192.0, 124.0, 94.0, 58.0, 44.0, 36.0, 28.0, 25.0, 14.0, 15.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.25946044921875, -2.1849365234375, -2.11041259765625, -2.035888671875, -1.96136474609375, -1.8868408203125, -1.81231689453125, -1.73779296875, -1.66326904296875, -1.5887451171875, -1.51422119140625, -1.439697265625, -1.36517333984375, -1.2906494140625, -1.21612548828125, -1.1416015625, -1.06707763671875, -0.9925537109375, -0.91802978515625, -0.843505859375, -0.76898193359375, -0.6944580078125, -0.61993408203125, -0.54541015625, -0.47088623046875, -0.3963623046875, -0.32183837890625, -0.247314453125, -0.17279052734375, -0.0982666015625, -0.02374267578125, 0.05078125, 0.12530517578125, 0.1998291015625, 0.27435302734375, 0.348876953125, 0.42340087890625, 0.4979248046875, 0.57244873046875, 0.64697265625, 0.72149658203125, 0.7960205078125, 0.87054443359375, 0.945068359375, 1.01959228515625, 1.0941162109375, 1.16864013671875, 1.2431640625, 1.31768798828125, 1.3922119140625, 1.46673583984375, 1.541259765625, 1.61578369140625, 1.6903076171875, 1.76483154296875, 1.83935546875, 1.91387939453125, 1.9884033203125, 2.06292724609375, 2.137451171875, 2.21197509765625, 2.2864990234375, 2.36102294921875, 2.435546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 13.0, 18.0, 22.0, 14.0, 37.0, 19.0, 24.0, 24.0, 33.0, 33.0, 39.0, 45.0, 50.0, 46.0, 40.0, 43.0, 41.0, 44.0, 45.0, 43.0, 35.0, 32.0, 24.0, 27.0, 29.0, 22.0, 25.0, 20.0, 17.0, 10.0, 17.0, 6.0, 9.0, 7.0, 6.0, 6.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.5001220703125, -5.332275390625, -5.1644287109375, -4.99658203125, -4.8287353515625, -4.660888671875, -4.4930419921875, -4.3251953125, -4.1573486328125, -3.989501953125, -3.8216552734375, -3.65380859375, -3.4859619140625, -3.318115234375, -3.1502685546875, -2.982421875, -2.8145751953125, -2.646728515625, -2.4788818359375, -2.31103515625, -2.1431884765625, -1.975341796875, -1.8074951171875, -1.6396484375, -1.4718017578125, -1.303955078125, -1.1361083984375, -0.96826171875, -0.8004150390625, -0.632568359375, -0.4647216796875, -0.296875, -0.1290283203125, 0.038818359375, 0.2066650390625, 0.37451171875, 0.5423583984375, 0.710205078125, 0.8780517578125, 1.0458984375, 1.2137451171875, 1.381591796875, 1.5494384765625, 1.71728515625, 1.8851318359375, 2.052978515625, 2.2208251953125, 2.388671875, 2.5565185546875, 2.724365234375, 2.8922119140625, 3.06005859375, 3.2279052734375, 3.395751953125, 3.5635986328125, 3.7314453125, 3.8992919921875, 4.067138671875, 4.2349853515625, 4.40283203125, 4.5706787109375, 4.738525390625, 4.9063720703125, 5.07421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 7.0, 15.0, 10.0, 15.0, 18.0, 42.0, 50.0, 60.0, 90.0, 144.0, 188.0, 265.0, 411.0, 565.0, 952.0, 1367.0, 2112.0, 3286.0, 5471.0, 9096.0, 15963.0, 31132.0, 263547.0, 628567.0, 39220.0, 18164.0, 10376.0, 6322.0, 3815.0, 2364.0, 1603.0, 1046.0, 687.0, 440.0, 328.0, 197.0, 173.0, 131.0, 87.0, 64.0, 49.0, 28.0, 30.0, 21.0, 10.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.42822265625, -0.4152946472167969, -0.40236663818359375, -0.3894386291503906, -0.3765106201171875, -0.3635826110839844, -0.35065460205078125, -0.3377265930175781, -0.324798583984375, -0.3118705749511719, -0.29894256591796875, -0.2860145568847656, -0.2730865478515625, -0.2601585388183594, -0.24723052978515625, -0.23430252075195312, -0.22137451171875, -0.20844650268554688, -0.19551849365234375, -0.18259048461914062, -0.1696624755859375, -0.15673446655273438, -0.14380645751953125, -0.13087844848632812, -0.117950439453125, -0.10502243041992188, -0.09209442138671875, -0.07916641235351562, -0.0662384033203125, -0.053310394287109375, -0.04038238525390625, -0.027454376220703125, -0.0145263671875, -0.001598358154296875, 0.01132965087890625, 0.024257659912109375, 0.0371856689453125, 0.050113677978515625, 0.06304168701171875, 0.07596969604492188, 0.088897705078125, 0.10182571411132812, 0.11475372314453125, 0.12768173217773438, 0.1406097412109375, 0.15353775024414062, 0.16646575927734375, 0.17939376831054688, 0.19232177734375, 0.20524978637695312, 0.21817779541015625, 0.23110580444335938, 0.2440338134765625, 0.2569618225097656, 0.26988983154296875, 0.2828178405761719, 0.295745849609375, 0.3086738586425781, 0.32160186767578125, 0.3345298767089844, 0.3474578857421875, 0.3603858947753906, 0.37331390380859375, 0.3862419128417969, 0.399169921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 11.0, 9.0, 12.0, 13.0, 18.0, 21.0, 22.0, 25.0, 33.0, 31.0, 41.0, 56.0, 45.0, 52.0, 46.0, 50.0, 58.0, 42.0, 45.0, 44.0, 44.0, 34.0, 36.0, 19.0, 25.0, 18.0, 19.0, 24.0, 12.0, 11.0, 9.0, 6.0, 10.0, 4.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.245737075805664e-05, -1.2113712728023529e-05, -1.1770054697990417e-05, -1.1426396667957306e-05, -1.1082738637924194e-05, -1.0739080607891083e-05, -1.0395422577857971e-05, -1.005176454782486e-05, -9.708106517791748e-06, -9.364448487758636e-06, -9.020790457725525e-06, -8.677132427692413e-06, -8.333474397659302e-06, -7.98981636762619e-06, -7.646158337593079e-06, -7.302500307559967e-06, -6.9588422775268555e-06, -6.615184247493744e-06, -6.271526217460632e-06, -5.927868187427521e-06, -5.584210157394409e-06, -5.240552127361298e-06, -4.896894097328186e-06, -4.5532360672950745e-06, -4.209578037261963e-06, -3.865920007228851e-06, -3.5222619771957397e-06, -3.178603947162628e-06, -2.8349459171295166e-06, -2.491287887096405e-06, -2.1476298570632935e-06, -1.8039718270301819e-06, -1.4603137969970703e-06, -1.1166557669639587e-06, -7.729977369308472e-07, -4.293397068977356e-07, -8.568167686462402e-08, 2.5797635316848755e-07, 6.016343832015991e-07, 9.452924132347107e-07, 1.2889504432678223e-06, 1.6326084733009338e-06, 1.9762665033340454e-06, 2.319924533367157e-06, 2.6635825634002686e-06, 3.00724059343338e-06, 3.3508986234664917e-06, 3.6945566534996033e-06, 4.038214683532715e-06, 4.381872713565826e-06, 4.725530743598938e-06, 5.0691887736320496e-06, 5.412846803665161e-06, 5.756504833698273e-06, 6.100162863731384e-06, 6.443820893764496e-06, 6.787478923797607e-06, 7.131136953830719e-06, 7.4747949838638306e-06, 7.818453013896942e-06, 8.162111043930054e-06, 8.505769073963165e-06, 8.849427103996277e-06, 9.193085134029388e-06, 9.5367431640625e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 12.0, 11.0, 21.0, 50.0, 43.0, 79.0, 114.0, 182.0, 250.0, 434.0, 668.0, 1044.0, 1604.0, 2615.0, 4494.0, 7555.0, 13621.0, 24495.0, 43915.0, 80250.0, 144688.0, 231839.0, 210738.0, 124514.0, 68386.0, 37485.0, 20748.0, 11857.0, 6738.0, 3774.0, 2331.0, 1468.0, 874.0, 556.0, 361.0, 233.0, 143.0, 115.0, 92.0, 48.0, 34.0, 25.0, 11.0, 10.0, 9.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4326171875, -0.4181327819824219, -0.40364837646484375, -0.3891639709472656, -0.3746795654296875, -0.3601951599121094, -0.34571075439453125, -0.3312263488769531, -0.316741943359375, -0.3022575378417969, -0.28777313232421875, -0.2732887268066406, -0.2588043212890625, -0.24431991577148438, -0.22983551025390625, -0.21535110473632812, -0.20086669921875, -0.18638229370117188, -0.17189788818359375, -0.15741348266601562, -0.1429290771484375, -0.12844467163085938, -0.11396026611328125, -0.09947586059570312, -0.084991455078125, -0.07050704956054688, -0.05602264404296875, -0.041538238525390625, -0.0270538330078125, -0.012569427490234375, 0.00191497802734375, 0.016399383544921875, 0.0308837890625, 0.045368194580078125, 0.05985260009765625, 0.07433700561523438, 0.0888214111328125, 0.10330581665039062, 0.11779022216796875, 0.13227462768554688, 0.146759033203125, 0.16124343872070312, 0.17572784423828125, 0.19021224975585938, 0.2046966552734375, 0.21918106079101562, 0.23366546630859375, 0.24814987182617188, 0.26263427734375, 0.2771186828613281, 0.29160308837890625, 0.3060874938964844, 0.3205718994140625, 0.3350563049316406, 0.34954071044921875, 0.3640251159667969, 0.378509521484375, 0.3929939270019531, 0.40747833251953125, 0.4219627380371094, 0.4364471435546875, 0.4509315490722656, 0.46541595458984375, 0.4799003601074219, 0.494384765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 7.0, 7.0, 11.0, 11.0, 17.0, 11.0, 21.0, 24.0, 35.0, 32.0, 37.0, 52.0, 54.0, 39.0, 50.0, 48.0, 42.0, 60.0, 58.0, 38.0, 40.0, 41.0, 28.0, 39.0, 27.0, 28.0, 21.0, 12.0, 14.0, 15.0, 9.0, 5.0, 11.0, 9.0, 9.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.1750335693359375, -0.169158935546875, -0.1632843017578125, -0.15740966796875, -0.1515350341796875, -0.145660400390625, -0.1397857666015625, -0.1339111328125, -0.1280364990234375, -0.122161865234375, -0.1162872314453125, -0.11041259765625, -0.1045379638671875, -0.098663330078125, -0.0927886962890625, -0.0869140625, -0.0810394287109375, -0.075164794921875, -0.0692901611328125, -0.06341552734375, -0.0575408935546875, -0.051666259765625, -0.0457916259765625, -0.0399169921875, -0.0340423583984375, -0.028167724609375, -0.0222930908203125, -0.01641845703125, -0.0105438232421875, -0.004669189453125, 0.0012054443359375, 0.007080078125, 0.0129547119140625, 0.018829345703125, 0.0247039794921875, 0.03057861328125, 0.0364532470703125, 0.042327880859375, 0.0482025146484375, 0.0540771484375, 0.0599517822265625, 0.065826416015625, 0.0717010498046875, 0.07757568359375, 0.0834503173828125, 0.089324951171875, 0.0951995849609375, 0.10107421875, 0.1069488525390625, 0.112823486328125, 0.1186981201171875, 0.12457275390625, 0.1304473876953125, 0.136322021484375, 0.1421966552734375, 0.1480712890625, 0.1539459228515625, 0.159820556640625, 0.1656951904296875, 0.17156982421875, 0.1774444580078125, 0.183319091796875, 0.1891937255859375, 0.195068359375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 11.0, 14.0, 18.0, 24.0, 23.0, 31.0, 32.0, 31.0, 38.0, 36.0, 40.0, 51.0, 62.0, 45.0, 51.0, 55.0, 61.0, 39.0, 45.0, 48.0, 31.0, 39.0, 32.0, 23.0, 18.0, 20.0, 11.0, 9.0, 10.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.420277118682861, -7.18087911605835, -6.94148063659668, -6.702082633972168, -6.462684631347656, -6.2232866287231445, -5.983888149261475, -5.744490146636963, -5.505091667175293, -5.265693664550781, -5.026295185089111, -4.7868971824646, -4.547499179840088, -4.308100700378418, -4.068702697753906, -3.8293046951293945, -3.589906692504883, -3.350508451461792, -3.1111104488372803, -2.8717122077941895, -2.6323142051696777, -2.392915964126587, -2.153517723083496, -1.9141196012496948, -1.6747214794158936, -1.4353233575820923, -1.195925235748291, -0.9565269947052002, -0.7171288728713989, -0.47773075103759766, -0.23833250999450684, 0.0010656118392944336, 0.2404632568359375, 0.47986140847206116, 0.7192595601081848, 0.9586577415466309, 1.1980558633804321, 1.4374539852142334, 1.6768522262573242, 1.9162503480911255, 2.1556484699249268, 2.3950467109680176, 2.6344447135925293, 2.87384295463562, 3.113241195678711, 3.3526391983032227, 3.5920374393463135, 3.8314356803894043, 4.070833683013916, 4.310231685638428, 4.549630165100098, 4.789028167724609, 5.028426170349121, 5.267824172973633, 5.507222652435303, 5.7466206550598145, 5.986019134521484, 6.225417137145996, 6.464815616607666, 6.704213619232178, 6.9436116218566895, 7.183010101318359, 7.422408103942871, 7.661806106567383, 7.9012041091918945]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 7.0, 11.0, 16.0, 9.0, 12.0, 13.0, 14.0, 14.0, 18.0, 25.0, 30.0, 18.0, 20.0, 31.0, 31.0, 31.0, 28.0, 31.0, 32.0, 35.0, 41.0, 29.0, 28.0, 40.0, 43.0, 32.0, 37.0, 28.0, 24.0, 32.0, 21.0, 24.0, 31.0, 21.0, 21.0, 15.0, 19.0, 14.0, 16.0, 5.0, 5.0, 8.0, 6.0, 12.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.447953224182129, -5.259078502655029, -5.0702033042907715, -4.881328582763672, -4.692453861236572, -4.503579139709473, -4.314703941345215, -4.125829219818115, -3.9369542598724365, -3.748079299926758, -3.559204578399658, -3.3703296184539795, -3.181454658508301, -2.992579936981201, -2.8037049770355225, -2.6148300170898438, -2.425955295562744, -2.2370803356170654, -2.048205614089966, -1.859330654144287, -1.670455813407898, -1.4815809726715088, -1.29270601272583, -1.103831171989441, -0.9149563312530518, -0.7260814905166626, -0.5372065901756287, -0.3483316898345947, -0.15945684909820557, 0.029417991638183594, 0.2182929515838623, 0.40716779232025146, 0.5960426330566406, 0.7849174737930298, 0.9737923741340637, 1.1626672744750977, 1.3515421152114868, 1.540416955947876, 1.7292919158935547, 1.9181667566299438, 2.107041597366333, 2.2959165573120117, 2.4847912788391113, 2.67366623878479, 2.8625411987304688, 3.0514159202575684, 3.240290880203247, 3.429165840148926, 3.6180405616760254, 3.806915521621704, 3.9957902431488037, 4.184665203094482, 4.373539924621582, 4.56241512298584, 4.7512898445129395, 4.940164566040039, 5.129039764404297, 5.3179144859313965, 5.506789684295654, 5.695664405822754, 5.8845391273498535, 6.073413848876953, 6.262289047241211, 6.4511637687683105, 6.64003849029541]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 11.0, 12.0, 22.0, 39.0, 64.0, 85.0, 132.0, 228.0, 337.0, 476.0, 723.0, 1218.0, 1743.0, 2761.0, 4107.0, 6329.0, 10111.0, 15051.0, 23146.0, 34993.0, 52668.0, 75207.0, 101137.0, 123102.0, 132427.0, 123875.0, 103196.0, 76800.0, 53881.0, 36021.0, 24002.0, 15510.0, 10013.0, 6673.0, 4310.0, 2880.0, 1860.0, 1211.0, 803.0, 506.0, 322.0, 183.0, 121.0, 79.0, 63.0, 36.0, 35.0, 18.0, 11.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.55078125, -4.4017333984375, -4.252685546875, -4.1036376953125, -3.95458984375, -3.8055419921875, -3.656494140625, -3.5074462890625, -3.3583984375, -3.2093505859375, -3.060302734375, -2.9112548828125, -2.76220703125, -2.6131591796875, -2.464111328125, -2.3150634765625, -2.166015625, -2.0169677734375, -1.867919921875, -1.7188720703125, -1.56982421875, -1.4207763671875, -1.271728515625, -1.1226806640625, -0.9736328125, -0.8245849609375, -0.675537109375, -0.5264892578125, -0.37744140625, -0.2283935546875, -0.079345703125, 0.0697021484375, 0.21875, 0.3677978515625, 0.516845703125, 0.6658935546875, 0.81494140625, 0.9639892578125, 1.113037109375, 1.2620849609375, 1.4111328125, 1.5601806640625, 1.709228515625, 1.8582763671875, 2.00732421875, 2.1563720703125, 2.305419921875, 2.4544677734375, 2.603515625, 2.7525634765625, 2.901611328125, 3.0506591796875, 3.19970703125, 3.3487548828125, 3.497802734375, 3.6468505859375, 3.7958984375, 3.9449462890625, 4.093994140625, 4.2430419921875, 4.39208984375, 4.5411376953125, 4.690185546875, 4.8392333984375, 4.98828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 14.0, 8.0, 16.0, 8.0, 15.0, 12.0, 11.0, 20.0, 19.0, 21.0, 24.0, 23.0, 37.0, 27.0, 32.0, 28.0, 33.0, 46.0, 27.0, 31.0, 44.0, 33.0, 40.0, 24.0, 33.0, 28.0, 37.0, 28.0, 31.0, 28.0, 30.0, 20.0, 32.0, 13.0, 19.0, 13.0, 17.0, 10.0, 12.0, 7.0, 7.0, 5.0, 7.0, 5.0, 4.0, 8.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.0625, -5.87188720703125, -5.6812744140625, -5.49066162109375, -5.300048828125, -5.10943603515625, -4.9188232421875, -4.72821044921875, -4.53759765625, -4.34698486328125, -4.1563720703125, -3.96575927734375, -3.775146484375, -3.58453369140625, -3.3939208984375, -3.20330810546875, -3.0126953125, -2.82208251953125, -2.6314697265625, -2.44085693359375, -2.250244140625, -2.05963134765625, -1.8690185546875, -1.67840576171875, -1.48779296875, -1.29718017578125, -1.1065673828125, -0.91595458984375, -0.725341796875, -0.53472900390625, -0.3441162109375, -0.15350341796875, 0.037109375, 0.22772216796875, 0.4183349609375, 0.60894775390625, 0.799560546875, 0.99017333984375, 1.1807861328125, 1.37139892578125, 1.56201171875, 1.75262451171875, 1.9432373046875, 2.13385009765625, 2.324462890625, 2.51507568359375, 2.7056884765625, 2.89630126953125, 3.0869140625, 3.27752685546875, 3.4681396484375, 3.65875244140625, 3.849365234375, 4.03997802734375, 4.2305908203125, 4.42120361328125, 4.61181640625, 4.80242919921875, 4.9930419921875, 5.18365478515625, 5.374267578125, 5.56488037109375, 5.7554931640625, 5.94610595703125, 6.13671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 6.0, 13.0, 24.0, 42.0, 38.0, 70.0, 84.0, 151.0, 211.0, 309.0, 544.0, 739.0, 1198.0, 1716.0, 2784.0, 4351.0, 6621.0, 10362.0, 16088.0, 25301.0, 38957.0, 57963.0, 83142.0, 110704.0, 131870.0, 136105.0, 121862.0, 95834.0, 68977.0, 46793.0, 30395.0, 19565.0, 12727.0, 8127.0, 5303.0, 3234.0, 2222.0, 1406.0, 895.0, 621.0, 401.0, 249.0, 196.0, 110.0, 88.0, 53.0, 22.0, 25.0, 18.0, 8.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 5.0], "bins": [-5.33203125, -5.16656494140625, -5.0010986328125, -4.83563232421875, -4.670166015625, -4.50469970703125, -4.3392333984375, -4.17376708984375, -4.00830078125, -3.84283447265625, -3.6773681640625, -3.51190185546875, -3.346435546875, -3.18096923828125, -3.0155029296875, -2.85003662109375, -2.6845703125, -2.51910400390625, -2.3536376953125, -2.18817138671875, -2.022705078125, -1.85723876953125, -1.6917724609375, -1.52630615234375, -1.36083984375, -1.19537353515625, -1.0299072265625, -0.86444091796875, -0.698974609375, -0.53350830078125, -0.3680419921875, -0.20257568359375, -0.037109375, 0.12835693359375, 0.2938232421875, 0.45928955078125, 0.624755859375, 0.79022216796875, 0.9556884765625, 1.12115478515625, 1.28662109375, 1.45208740234375, 1.6175537109375, 1.78302001953125, 1.948486328125, 2.11395263671875, 2.2794189453125, 2.44488525390625, 2.6103515625, 2.77581787109375, 2.9412841796875, 3.10675048828125, 3.272216796875, 3.43768310546875, 3.6031494140625, 3.76861572265625, 3.93408203125, 4.09954833984375, 4.2650146484375, 4.43048095703125, 4.595947265625, 4.76141357421875, 4.9268798828125, 5.09234619140625, 5.2578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 9.0, 7.0, 14.0, 10.0, 7.0, 15.0, 21.0, 30.0, 27.0, 23.0, 40.0, 44.0, 44.0, 42.0, 42.0, 43.0, 39.0, 37.0, 36.0, 42.0, 59.0, 43.0, 35.0, 28.0, 28.0, 26.0, 30.0, 24.0, 20.0, 19.0, 20.0, 14.0, 15.0, 8.0, 9.0, 4.0, 9.0, 6.0, 5.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.75390625, -4.616455078125, -4.47900390625, -4.341552734375, -4.2041015625, -4.066650390625, -3.92919921875, -3.791748046875, -3.654296875, -3.516845703125, -3.37939453125, -3.241943359375, -3.1044921875, -2.967041015625, -2.82958984375, -2.692138671875, -2.5546875, -2.417236328125, -2.27978515625, -2.142333984375, -2.0048828125, -1.867431640625, -1.72998046875, -1.592529296875, -1.455078125, -1.317626953125, -1.18017578125, -1.042724609375, -0.9052734375, -0.767822265625, -0.63037109375, -0.492919921875, -0.35546875, -0.218017578125, -0.08056640625, 0.056884765625, 0.1943359375, 0.331787109375, 0.46923828125, 0.606689453125, 0.744140625, 0.881591796875, 1.01904296875, 1.156494140625, 1.2939453125, 1.431396484375, 1.56884765625, 1.706298828125, 1.84375, 1.981201171875, 2.11865234375, 2.256103515625, 2.3935546875, 2.531005859375, 2.66845703125, 2.805908203125, 2.943359375, 3.080810546875, 3.21826171875, 3.355712890625, 3.4931640625, 3.630615234375, 3.76806640625, 3.905517578125, 4.04296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [7.0, 4.0, 6.0, 5.0, 19.0, 22.0, 20.0, 44.0, 64.0, 74.0, 131.0, 181.0, 278.0, 409.0, 534.0, 773.0, 1139.0, 1685.0, 2364.0, 3623.0, 5222.0, 7692.0, 10990.0, 16280.0, 23366.0, 32961.0, 45029.0, 59869.0, 76671.0, 91561.0, 103015.0, 105562.0, 100971.0, 88300.0, 72385.0, 56547.0, 41858.0, 30396.0, 21397.0, 14840.0, 10124.0, 6976.0, 4786.0, 3282.0, 2253.0, 1532.0, 1023.0, 719.0, 506.0, 298.0, 250.0, 173.0, 101.0, 68.0, 61.0, 40.0, 31.0, 23.0, 13.0, 9.0, 8.0, 3.0, 2.0, 1.0], "bins": [-1.359375, -1.3160552978515625, -1.272735595703125, -1.2294158935546875, -1.18609619140625, -1.1427764892578125, -1.099456787109375, -1.0561370849609375, -1.0128173828125, -0.9694976806640625, -0.926177978515625, -0.8828582763671875, -0.83953857421875, -0.7962188720703125, -0.752899169921875, -0.7095794677734375, -0.666259765625, -0.6229400634765625, -0.579620361328125, -0.5363006591796875, -0.49298095703125, -0.4496612548828125, -0.406341552734375, -0.3630218505859375, -0.3197021484375, -0.2763824462890625, -0.233062744140625, -0.1897430419921875, -0.14642333984375, -0.1031036376953125, -0.059783935546875, -0.0164642333984375, 0.02685546875, 0.0701751708984375, 0.113494873046875, 0.1568145751953125, 0.20013427734375, 0.2434539794921875, 0.286773681640625, 0.3300933837890625, 0.3734130859375, 0.4167327880859375, 0.460052490234375, 0.5033721923828125, 0.54669189453125, 0.5900115966796875, 0.633331298828125, 0.6766510009765625, 0.719970703125, 0.7632904052734375, 0.806610107421875, 0.8499298095703125, 0.89324951171875, 0.9365692138671875, 0.979888916015625, 1.0232086181640625, 1.0665283203125, 1.1098480224609375, 1.153167724609375, 1.1964874267578125, 1.23980712890625, 1.2831268310546875, 1.326446533203125, 1.3697662353515625, 1.4130859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 4.0, 10.0, 12.0, 16.0, 20.0, 7.0, 25.0, 27.0, 27.0, 35.0, 31.0, 42.0, 36.0, 36.0, 40.0, 37.0, 45.0, 42.0, 47.0, 46.0, 42.0, 41.0, 39.0, 36.0, 31.0, 31.0, 23.0, 34.0, 16.0, 21.0, 17.0, 12.0, 9.0, 14.0, 7.0, 3.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00018095970153808594, -0.00017508119344711304, -0.00016920268535614014, -0.00016332417726516724, -0.00015744566917419434, -0.00015156716108322144, -0.00014568865299224854, -0.00013981014490127563, -0.00013393163681030273, -0.00012805312871932983, -0.00012217462062835693, -0.00011629611253738403, -0.00011041760444641113, -0.00010453909635543823, -9.866058826446533e-05, -9.278208017349243e-05, -8.690357208251953e-05, -8.102506399154663e-05, -7.514655590057373e-05, -6.926804780960083e-05, -6.338953971862793e-05, -5.751103162765503e-05, -5.163252353668213e-05, -4.575401544570923e-05, -3.987550735473633e-05, -3.399699926376343e-05, -2.8118491172790527e-05, -2.2239983081817627e-05, -1.6361474990844727e-05, -1.0482966899871826e-05, -4.604458808898926e-06, 1.2740492820739746e-06, 7.152557373046875e-06, 1.3031065464019775e-05, 1.8909573554992676e-05, 2.4788081645965576e-05, 3.0666589736938477e-05, 3.654509782791138e-05, 4.242360591888428e-05, 4.830211400985718e-05, 5.418062210083008e-05, 6.005913019180298e-05, 6.593763828277588e-05, 7.181614637374878e-05, 7.769465446472168e-05, 8.357316255569458e-05, 8.945167064666748e-05, 9.533017873764038e-05, 0.00010120868682861328, 0.00010708719491958618, 0.00011296570301055908, 0.00011884421110153198, 0.00012472271919250488, 0.00013060122728347778, 0.00013647973537445068, 0.00014235824346542358, 0.00014823675155639648, 0.00015411525964736938, 0.00015999376773834229, 0.00016587227582931519, 0.00017175078392028809, 0.00017762929201126099, 0.0001835078001022339, 0.0001893863081932068, 0.0001952648162841797]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 20.0, 34.0, 26.0, 54.0, 72.0, 114.0, 164.0, 242.0, 400.0, 541.0, 779.0, 1268.0, 1891.0, 2896.0, 4453.0, 6719.0, 9989.0, 15209.0, 22965.0, 33277.0, 46945.0, 63210.0, 81036.0, 97557.0, 108766.0, 110798.0, 103063.0, 88788.0, 71555.0, 54268.0, 39164.0, 27368.0, 18615.0, 12264.0, 8313.0, 5307.0, 3620.0, 2283.0, 1513.0, 1015.0, 687.0, 452.0, 259.0, 171.0, 132.0, 96.0, 56.0, 40.0, 18.0, 12.0, 15.0, 20.0, 11.0, 4.0, 2.0, 6.0], "bins": [-1.578125, -1.5306396484375, -1.483154296875, -1.4356689453125, -1.38818359375, -1.3406982421875, -1.293212890625, -1.2457275390625, -1.1982421875, -1.1507568359375, -1.103271484375, -1.0557861328125, -1.00830078125, -0.9608154296875, -0.913330078125, -0.8658447265625, -0.818359375, -0.7708740234375, -0.723388671875, -0.6759033203125, -0.62841796875, -0.5809326171875, -0.533447265625, -0.4859619140625, -0.4384765625, -0.3909912109375, -0.343505859375, -0.2960205078125, -0.24853515625, -0.2010498046875, -0.153564453125, -0.1060791015625, -0.05859375, -0.0111083984375, 0.036376953125, 0.0838623046875, 0.13134765625, 0.1788330078125, 0.226318359375, 0.2738037109375, 0.3212890625, 0.3687744140625, 0.416259765625, 0.4637451171875, 0.51123046875, 0.5587158203125, 0.606201171875, 0.6536865234375, 0.701171875, 0.7486572265625, 0.796142578125, 0.8436279296875, 0.89111328125, 0.9385986328125, 0.986083984375, 1.0335693359375, 1.0810546875, 1.1285400390625, 1.176025390625, 1.2235107421875, 1.27099609375, 1.3184814453125, 1.365966796875, 1.4134521484375, 1.4609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 9.0, 20.0, 16.0, 11.0, 22.0, 16.0, 24.0, 27.0, 33.0, 36.0, 44.0, 35.0, 44.0, 50.0, 52.0, 46.0, 42.0, 56.0, 42.0, 39.0, 50.0, 26.0, 38.0, 41.0, 26.0, 25.0, 22.0, 18.0, 18.0, 15.0, 8.0, 8.0, 6.0, 6.0, 6.0, 4.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.8759765625, -0.8523330688476562, -0.8286895751953125, -0.8050460815429688, -0.781402587890625, -0.7577590942382812, -0.7341156005859375, -0.7104721069335938, -0.68682861328125, -0.6631851196289062, -0.6395416259765625, -0.6158981323242188, -0.592254638671875, -0.5686111450195312, -0.5449676513671875, -0.5213241577148438, -0.4976806640625, -0.47403717041015625, -0.4503936767578125, -0.42675018310546875, -0.403106689453125, -0.37946319580078125, -0.3558197021484375, -0.33217620849609375, -0.30853271484375, -0.28488922119140625, -0.2612457275390625, -0.23760223388671875, -0.213958740234375, -0.19031524658203125, -0.1666717529296875, -0.14302825927734375, -0.119384765625, -0.09574127197265625, -0.0720977783203125, -0.04845428466796875, -0.024810791015625, -0.00116729736328125, 0.0224761962890625, 0.04611968994140625, 0.06976318359375, 0.09340667724609375, 0.1170501708984375, 0.14069366455078125, 0.164337158203125, 0.18798065185546875, 0.2116241455078125, 0.23526763916015625, 0.2589111328125, 0.28255462646484375, 0.3061981201171875, 0.32984161376953125, 0.353485107421875, 0.37712860107421875, 0.4007720947265625, 0.42441558837890625, 0.44805908203125, 0.47170257568359375, 0.4953460693359375, 0.5189895629882812, 0.542633056640625, 0.5662765502929688, 0.5899200439453125, 0.6135635375976562, 0.63720703125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 6.0, 12.0, 12.0, 21.0, 20.0, 18.0, 36.0, 32.0, 39.0, 44.0, 41.0, 39.0, 50.0, 52.0, 58.0, 59.0, 54.0, 58.0, 60.0, 39.0, 46.0, 40.0, 27.0, 19.0, 25.0, 15.0, 10.0, 9.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.592833042144775, -7.343437194824219, -7.094040870666504, -6.844645023345947, -6.595248699188232, -6.345852851867676, -6.096456527709961, -5.847060680389404, -5.597664833068848, -5.348268985748291, -5.098872661590576, -4.8494768142700195, -4.600080490112305, -4.350684642791748, -4.101288795471191, -3.8518924713134766, -3.6024961471557617, -3.353100061416626, -3.1037039756774902, -2.8543081283569336, -2.6049118041992188, -2.355515956878662, -2.1061198711395264, -1.8567237854003906, -1.6073276996612549, -1.3579316139221191, -1.1085355281829834, -0.8591395616531372, -0.6097434759140015, -0.3603473901748657, -0.11095142364501953, 0.1384446620941162, 0.38784122467041016, 0.6372373104095459, 0.8866333365440369, 1.1360293626785278, 1.3854254484176636, 1.6348215341567993, 1.8842175006866455, 2.1336135864257812, 2.383009672164917, 2.6324057579040527, 2.8818018436431885, 3.131197929382324, 3.380593776702881, 3.6299901008605957, 3.8793859481811523, 4.128782272338867, 4.378178119659424, 4.6275739669799805, 4.876970291137695, 5.126366138458252, 5.375762462615967, 5.625158309936523, 5.874554634094238, 6.123950481414795, 6.373346328735352, 6.622742176055908, 6.872138500213623, 7.12153434753418, 7.3709306716918945, 7.620326519012451, 7.869722366333008, 8.119118690490723, 8.368515014648438]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 10.0, 8.0, 12.0, 12.0, 23.0, 17.0, 19.0, 16.0, 23.0, 21.0, 25.0, 30.0, 32.0, 31.0, 32.0, 37.0, 38.0, 26.0, 31.0, 24.0, 45.0, 28.0, 44.0, 30.0, 30.0, 34.0, 31.0, 27.0, 24.0, 26.0, 24.0, 26.0, 19.0, 27.0, 21.0, 11.0, 19.0, 10.0, 9.0, 9.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.416293621063232, -6.203879356384277, -5.9914655685424805, -5.779051303863525, -5.56663703918457, -5.354223251342773, -5.141808986663818, -4.929394721984863, -4.716980934143066, -4.504566669464111, -4.2921528816223145, -4.079738616943359, -3.8673243522644043, -3.6549103260040283, -3.4424962997436523, -3.2300820350646973, -3.017667770385742, -2.805253744125366, -2.592839479446411, -2.380425453186035, -2.16801118850708, -1.955597162246704, -1.7431831359863281, -1.5307689905166626, -1.318354845046997, -1.1059406995773315, -0.8935266137123108, -0.68111252784729, -0.4686983823776245, -0.256284236907959, -0.04387021064758301, 0.16854393482208252, 0.38095808029174805, 0.5933722257614136, 0.8057863116264343, 1.018200397491455, 1.2306145429611206, 1.4430286884307861, 1.655442714691162, 1.8678568601608276, 2.080271005630493, 2.292685031890869, 2.505099296569824, 2.7175133228302, 2.929927349090576, 3.1423416137695312, 3.3547556400299072, 3.567169666290283, 3.7795839309692383, 3.9919979572296143, 4.20441198348999, 4.416826248168945, 4.6292405128479, 4.8416547775268555, 5.054068565368652, 5.266482830047607, 5.4788970947265625, 5.691311359405518, 5.9037251472473145, 6.1161394119262695, 6.328553676605225, 6.54096794128418, 6.753381729125977, 6.965795993804932, 7.1782097816467285]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 16.0, 26.0, 41.0, 50.0, 71.0, 114.0, 122.0, 237.0, 304.0, 472.0, 729.0, 1057.0, 1643.0, 2586.0, 3909.0, 6308.0, 10318.0, 16873.0, 28395.0, 49222.0, 84050.0, 145717.0, 246840.0, 394098.0, 559052.0, 664900.0, 639527.0, 502421.0, 337820.0, 205889.0, 120621.0, 69728.0, 40102.0, 23639.0, 14168.0, 8588.0, 5114.0, 3352.0, 2100.0, 1394.0, 887.0, 580.0, 395.0, 251.0, 172.0, 138.0, 84.0, 54.0, 37.0, 17.0, 13.0, 12.0, 11.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-6.06640625, -5.87579345703125, -5.6851806640625, -5.49456787109375, -5.303955078125, -5.11334228515625, -4.9227294921875, -4.73211669921875, -4.54150390625, -4.35089111328125, -4.1602783203125, -3.96966552734375, -3.779052734375, -3.58843994140625, -3.3978271484375, -3.20721435546875, -3.0166015625, -2.82598876953125, -2.6353759765625, -2.44476318359375, -2.254150390625, -2.06353759765625, -1.8729248046875, -1.68231201171875, -1.49169921875, -1.30108642578125, -1.1104736328125, -0.91986083984375, -0.729248046875, -0.53863525390625, -0.3480224609375, -0.15740966796875, 0.033203125, 0.22381591796875, 0.4144287109375, 0.60504150390625, 0.795654296875, 0.98626708984375, 1.1768798828125, 1.36749267578125, 1.55810546875, 1.74871826171875, 1.9393310546875, 2.12994384765625, 2.320556640625, 2.51116943359375, 2.7017822265625, 2.89239501953125, 3.0830078125, 3.27362060546875, 3.4642333984375, 3.65484619140625, 3.845458984375, 4.03607177734375, 4.2266845703125, 4.41729736328125, 4.60791015625, 4.79852294921875, 4.9891357421875, 5.17974853515625, 5.370361328125, 5.56097412109375, 5.7515869140625, 5.94219970703125, 6.1328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 3.0, 9.0, 18.0, 11.0, 21.0, 18.0, 25.0, 24.0, 15.0, 19.0, 29.0, 26.0, 46.0, 35.0, 30.0, 38.0, 28.0, 25.0, 33.0, 43.0, 42.0, 33.0, 37.0, 43.0, 26.0, 33.0, 36.0, 32.0, 21.0, 22.0, 26.0, 17.0, 17.0, 16.0, 21.0, 13.0, 8.0, 9.0, 4.0, 12.0, 9.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.671875, -6.47222900390625, -6.2725830078125, -6.07293701171875, -5.873291015625, -5.67364501953125, -5.4739990234375, -5.27435302734375, -5.07470703125, -4.87506103515625, -4.6754150390625, -4.47576904296875, -4.276123046875, -4.07647705078125, -3.8768310546875, -3.67718505859375, -3.4775390625, -3.27789306640625, -3.0782470703125, -2.87860107421875, -2.678955078125, -2.47930908203125, -2.2796630859375, -2.08001708984375, -1.88037109375, -1.68072509765625, -1.4810791015625, -1.28143310546875, -1.081787109375, -0.88214111328125, -0.6824951171875, -0.48284912109375, -0.283203125, -0.08355712890625, 0.1160888671875, 0.31573486328125, 0.515380859375, 0.71502685546875, 0.9146728515625, 1.11431884765625, 1.31396484375, 1.51361083984375, 1.7132568359375, 1.91290283203125, 2.112548828125, 2.31219482421875, 2.5118408203125, 2.71148681640625, 2.9111328125, 3.11077880859375, 3.3104248046875, 3.51007080078125, 3.709716796875, 3.90936279296875, 4.1090087890625, 4.30865478515625, 4.50830078125, 4.70794677734375, 4.9075927734375, 5.10723876953125, 5.306884765625, 5.50653076171875, 5.7061767578125, 5.90582275390625, 6.10546875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 12.0, 7.0, 10.0, 19.0, 44.0, 35.0, 88.0, 110.0, 188.0, 314.0, 464.0, 793.0, 1155.0, 1925.0, 3131.0, 5099.0, 8658.0, 14456.0, 24369.0, 41755.0, 69731.0, 117716.0, 193883.0, 303772.0, 439761.0, 566221.0, 617926.0, 563742.0, 437269.0, 300799.0, 192669.0, 117237.0, 69247.0, 41408.0, 24298.0, 14169.0, 8539.0, 5087.0, 3057.0, 1873.0, 1208.0, 744.0, 501.0, 273.0, 193.0, 102.0, 85.0, 58.0, 31.0, 22.0, 15.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40625, -6.18902587890625, -5.9718017578125, -5.75457763671875, -5.537353515625, -5.32012939453125, -5.1029052734375, -4.88568115234375, -4.66845703125, -4.45123291015625, -4.2340087890625, -4.01678466796875, -3.799560546875, -3.58233642578125, -3.3651123046875, -3.14788818359375, -2.9306640625, -2.71343994140625, -2.4962158203125, -2.27899169921875, -2.061767578125, -1.84454345703125, -1.6273193359375, -1.41009521484375, -1.19287109375, -0.97564697265625, -0.7584228515625, -0.54119873046875, -0.323974609375, -0.10675048828125, 0.1104736328125, 0.32769775390625, 0.544921875, 0.76214599609375, 0.9793701171875, 1.19659423828125, 1.413818359375, 1.63104248046875, 1.8482666015625, 2.06549072265625, 2.28271484375, 2.49993896484375, 2.7171630859375, 2.93438720703125, 3.151611328125, 3.36883544921875, 3.5860595703125, 3.80328369140625, 4.0205078125, 4.23773193359375, 4.4549560546875, 4.67218017578125, 4.889404296875, 5.10662841796875, 5.3238525390625, 5.54107666015625, 5.75830078125, 5.97552490234375, 6.1927490234375, 6.40997314453125, 6.627197265625, 6.84442138671875, 7.0616455078125, 7.27886962890625, 7.49609375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 11.0, 7.0, 16.0, 25.0, 24.0, 25.0, 36.0, 51.0, 58.0, 59.0, 86.0, 89.0, 99.0, 119.0, 132.0, 160.0, 163.0, 182.0, 200.0, 225.0, 215.0, 230.0, 207.0, 195.0, 206.0, 193.0, 188.0, 138.0, 134.0, 105.0, 87.0, 75.0, 58.0, 53.0, 57.0, 30.0, 32.0, 24.0, 13.0, 15.0, 11.0, 2.0, 6.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8984375, -2.805145263671875, -2.71185302734375, -2.618560791015625, -2.5252685546875, -2.431976318359375, -2.33868408203125, -2.245391845703125, -2.152099609375, -2.058807373046875, -1.96551513671875, -1.872222900390625, -1.7789306640625, -1.685638427734375, -1.59234619140625, -1.499053955078125, -1.40576171875, -1.312469482421875, -1.21917724609375, -1.125885009765625, -1.0325927734375, -0.939300537109375, -0.84600830078125, -0.752716064453125, -0.659423828125, -0.566131591796875, -0.47283935546875, -0.379547119140625, -0.2862548828125, -0.192962646484375, -0.09967041015625, -0.006378173828125, 0.0869140625, 0.180206298828125, 0.27349853515625, 0.366790771484375, 0.4600830078125, 0.553375244140625, 0.64666748046875, 0.739959716796875, 0.833251953125, 0.926544189453125, 1.01983642578125, 1.113128662109375, 1.2064208984375, 1.299713134765625, 1.39300537109375, 1.486297607421875, 1.57958984375, 1.672882080078125, 1.76617431640625, 1.859466552734375, 1.9527587890625, 2.046051025390625, 2.13934326171875, 2.232635498046875, 2.325927734375, 2.419219970703125, 2.51251220703125, 2.605804443359375, 2.6990966796875, 2.792388916015625, 2.88568115234375, 2.978973388671875, 3.072265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 11.0, 7.0, 13.0, 16.0, 11.0, 17.0, 13.0, 24.0, 29.0, 37.0, 30.0, 42.0, 38.0, 50.0, 57.0, 40.0, 50.0, 48.0, 35.0, 55.0, 44.0, 42.0, 41.0, 42.0, 40.0, 34.0, 21.0, 25.0, 18.0, 17.0, 9.0, 5.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.599751472473145, -8.346966743469238, -8.094181060791016, -7.841395854949951, -7.588610649108887, -7.335825443267822, -7.083040237426758, -6.830255508422852, -6.577469825744629, -6.3246846199035645, -6.0718994140625, -5.8191142082214355, -5.566329002380371, -5.313543796539307, -5.060758590698242, -4.807973861694336, -4.5551886558532715, -4.302403450012207, -4.049618244171143, -3.796833038330078, -3.5440478324890137, -3.291262626647949, -3.038477659225464, -2.7856924533843994, -2.532907247543335, -2.2801220417022705, -2.027336835861206, -1.7745517492294312, -1.5217665433883667, -1.2689813375473022, -1.0161962509155273, -0.7634110450744629, -0.5106258392333984, -0.25784066319465637, -0.005055487155914307, 0.24772965908050537, 0.5005148649215698, 0.7533000707626343, 1.0060851573944092, 1.2588703632354736, 1.511655569076538, 1.7644407749176025, 2.017225980758667, 2.2700109481811523, 2.522796154022217, 2.7755813598632812, 3.0283665657043457, 3.28115177154541, 3.5339369773864746, 3.786722183227539, 4.0395073890686035, 4.292292594909668, 4.545077800750732, 4.797863006591797, 5.050647735595703, 5.303433418273926, 5.556218147277832, 5.8090033531188965, 6.061788558959961, 6.314573764801025, 6.56735897064209, 6.820144176483154, 7.072929382324219, 7.325714111328125, 7.578499794006348]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 9.0, 13.0, 11.0, 14.0, 16.0, 21.0, 23.0, 33.0, 26.0, 30.0, 30.0, 34.0, 32.0, 31.0, 42.0, 31.0, 44.0, 50.0, 36.0, 31.0, 31.0, 45.0, 40.0, 20.0, 32.0, 37.0, 29.0, 33.0, 30.0, 19.0, 19.0, 17.0, 14.0, 10.0, 11.0, 11.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.779031753540039, -7.521757125854492, -7.264482498168945, -7.007207870483398, -6.749933242797852, -6.492658615112305, -6.235384464263916, -5.978109836578369, -5.720835208892822, -5.463560581207275, -5.2062859535217285, -4.949011325836182, -4.691737174987793, -4.434462547302246, -4.177187919616699, -3.9199132919311523, -3.6626386642456055, -3.4053640365600586, -3.1480894088745117, -2.890815019607544, -2.633540391921997, -2.37626576423645, -2.1189913749694824, -1.8617167472839355, -1.6044421195983887, -1.3471674919128418, -1.0898929834365845, -0.8326184153556824, -0.5753438472747803, -0.3180692195892334, -0.060794711112976074, 0.19647979736328125, 0.4537534713745117, 0.7110280394554138, 0.9683026075363159, 1.2255771160125732, 1.4828517436981201, 1.740126371383667, 1.9974008798599243, 2.2546753883361816, 2.5119500160217285, 2.7692246437072754, 3.0264992713928223, 3.28377366065979, 3.541048288345337, 3.798322916030884, 4.055597305297852, 4.312871932983398, 4.570146560668945, 4.827421188354492, 5.084695816040039, 5.341970443725586, 5.599245071411133, 5.85651969909668, 6.113793849945068, 6.371068477630615, 6.628343105316162, 6.885617733001709, 7.142892360687256, 7.400166988372803, 7.657441139221191, 7.914715766906738, 8.171990394592285, 8.429265022277832, 8.686539649963379]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 10.0, 17.0, 27.0, 36.0, 52.0, 77.0, 132.0, 198.0, 273.0, 426.0, 571.0, 905.0, 1411.0, 2124.0, 3312.0, 5076.0, 7914.0, 12582.0, 20255.0, 32985.0, 54434.0, 86339.0, 132015.0, 174784.0, 170599.0, 126144.0, 81552.0, 50593.0, 31354.0, 19080.0, 11909.0, 7428.0, 4755.0, 3106.0, 2065.0, 1378.0, 892.0, 572.0, 381.0, 249.0, 200.0, 125.0, 69.0, 43.0, 29.0, 25.0, 15.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0], "bins": [-1.35546875, -1.3143157958984375, -1.273162841796875, -1.2320098876953125, -1.19085693359375, -1.1497039794921875, -1.108551025390625, -1.0673980712890625, -1.0262451171875, -0.9850921630859375, -0.943939208984375, -0.9027862548828125, -0.86163330078125, -0.8204803466796875, -0.779327392578125, -0.7381744384765625, -0.697021484375, -0.6558685302734375, -0.614715576171875, -0.5735626220703125, -0.53240966796875, -0.4912567138671875, -0.450103759765625, -0.4089508056640625, -0.3677978515625, -0.3266448974609375, -0.285491943359375, -0.2443389892578125, -0.20318603515625, -0.1620330810546875, -0.120880126953125, -0.0797271728515625, -0.03857421875, 0.0025787353515625, 0.043731689453125, 0.0848846435546875, 0.12603759765625, 0.1671905517578125, 0.208343505859375, 0.2494964599609375, 0.2906494140625, 0.3318023681640625, 0.372955322265625, 0.4141082763671875, 0.45526123046875, 0.4964141845703125, 0.537567138671875, 0.5787200927734375, 0.619873046875, 0.6610260009765625, 0.702178955078125, 0.7433319091796875, 0.78448486328125, 0.8256378173828125, 0.866790771484375, 0.9079437255859375, 0.9490966796875, 0.9902496337890625, 1.031402587890625, 1.0725555419921875, 1.11370849609375, 1.1548614501953125, 1.196014404296875, 1.2371673583984375, 1.2783203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 7.0, 7.0, 17.0, 13.0, 10.0, 23.0, 32.0, 31.0, 19.0, 32.0, 29.0, 31.0, 31.0, 43.0, 31.0, 44.0, 30.0, 39.0, 44.0, 42.0, 37.0, 36.0, 29.0, 24.0, 28.0, 28.0, 46.0, 27.0, 27.0, 28.0, 19.0, 17.0, 11.0, 9.0, 16.0, 9.0, 7.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.3046875, -8.04638671875, -7.7880859375, -7.52978515625, -7.271484375, -7.01318359375, -6.7548828125, -6.49658203125, -6.23828125, -5.97998046875, -5.7216796875, -5.46337890625, -5.205078125, -4.94677734375, -4.6884765625, -4.43017578125, -4.171875, -3.91357421875, -3.6552734375, -3.39697265625, -3.138671875, -2.88037109375, -2.6220703125, -2.36376953125, -2.10546875, -1.84716796875, -1.5888671875, -1.33056640625, -1.072265625, -0.81396484375, -0.5556640625, -0.29736328125, -0.0390625, 0.21923828125, 0.4775390625, 0.73583984375, 0.994140625, 1.25244140625, 1.5107421875, 1.76904296875, 2.02734375, 2.28564453125, 2.5439453125, 2.80224609375, 3.060546875, 3.31884765625, 3.5771484375, 3.83544921875, 4.09375, 4.35205078125, 4.6103515625, 4.86865234375, 5.126953125, 5.38525390625, 5.6435546875, 5.90185546875, 6.16015625, 6.41845703125, 6.6767578125, 6.93505859375, 7.193359375, 7.45166015625, 7.7099609375, 7.96826171875, 8.2265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 13.0, 18.0, 24.0, 42.0, 56.0, 83.0, 139.0, 223.0, 357.0, 584.0, 1040.0, 1740.0, 3191.0, 5781.0, 11153.0, 23517.0, 89298.0, 756928.0, 103379.0, 25219.0, 11758.0, 6116.0, 3334.0, 1885.0, 1067.0, 585.0, 401.0, 209.0, 149.0, 91.0, 66.0, 33.0, 23.0, 18.0, 16.0, 9.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.0523681640625, -2.952392578125, -2.8524169921875, -2.75244140625, -2.6524658203125, -2.552490234375, -2.4525146484375, -2.3525390625, -2.2525634765625, -2.152587890625, -2.0526123046875, -1.95263671875, -1.8526611328125, -1.752685546875, -1.6527099609375, -1.552734375, -1.4527587890625, -1.352783203125, -1.2528076171875, -1.15283203125, -1.0528564453125, -0.952880859375, -0.8529052734375, -0.7529296875, -0.6529541015625, -0.552978515625, -0.4530029296875, -0.35302734375, -0.2530517578125, -0.153076171875, -0.0531005859375, 0.046875, 0.1468505859375, 0.246826171875, 0.3468017578125, 0.44677734375, 0.5467529296875, 0.646728515625, 0.7467041015625, 0.8466796875, 0.9466552734375, 1.046630859375, 1.1466064453125, 1.24658203125, 1.3465576171875, 1.446533203125, 1.5465087890625, 1.646484375, 1.7464599609375, 1.846435546875, 1.9464111328125, 2.04638671875, 2.1463623046875, 2.246337890625, 2.3463134765625, 2.4462890625, 2.5462646484375, 2.646240234375, 2.7462158203125, 2.84619140625, 2.9461669921875, 3.046142578125, 3.1461181640625, 3.24609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 7.0, 9.0, 14.0, 11.0, 23.0, 11.0, 15.0, 31.0, 27.0, 27.0, 39.0, 27.0, 28.0, 32.0, 40.0, 39.0, 41.0, 42.0, 36.0, 46.0, 36.0, 36.0, 40.0, 37.0, 37.0, 31.0, 25.0, 25.0, 21.0, 27.0, 18.0, 13.0, 14.0, 10.0, 14.0, 8.0, 12.0, 4.0, 12.0, 8.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.69140625, -6.47784423828125, -6.2642822265625, -6.05072021484375, -5.837158203125, -5.62359619140625, -5.4100341796875, -5.19647216796875, -4.98291015625, -4.76934814453125, -4.5557861328125, -4.34222412109375, -4.128662109375, -3.91510009765625, -3.7015380859375, -3.48797607421875, -3.2744140625, -3.06085205078125, -2.8472900390625, -2.63372802734375, -2.420166015625, -2.20660400390625, -1.9930419921875, -1.77947998046875, -1.56591796875, -1.35235595703125, -1.1387939453125, -0.92523193359375, -0.711669921875, -0.49810791015625, -0.2845458984375, -0.07098388671875, 0.142578125, 0.35614013671875, 0.5697021484375, 0.78326416015625, 0.996826171875, 1.21038818359375, 1.4239501953125, 1.63751220703125, 1.85107421875, 2.06463623046875, 2.2781982421875, 2.49176025390625, 2.705322265625, 2.91888427734375, 3.1324462890625, 3.34600830078125, 3.5595703125, 3.77313232421875, 3.9866943359375, 4.20025634765625, 4.413818359375, 4.62738037109375, 4.8409423828125, 5.05450439453125, 5.26806640625, 5.48162841796875, 5.6951904296875, 5.90875244140625, 6.122314453125, 6.33587646484375, 6.5494384765625, 6.76300048828125, 6.9765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 4.0, 14.0, 11.0, 15.0, 18.0, 43.0, 50.0, 66.0, 95.0, 162.0, 222.0, 295.0, 491.0, 736.0, 1228.0, 2061.0, 3527.0, 6544.0, 12868.0, 27731.0, 221346.0, 701826.0, 35651.0, 15401.0, 7672.0, 4143.0, 2396.0, 1363.0, 910.0, 544.0, 349.0, 220.0, 157.0, 131.0, 73.0, 50.0, 35.0, 29.0, 25.0, 13.0, 8.0, 4.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.857421875, -0.8322982788085938, -0.8071746826171875, -0.7820510864257812, -0.756927490234375, -0.7318038940429688, -0.7066802978515625, -0.6815567016601562, -0.65643310546875, -0.6313095092773438, -0.6061859130859375, -0.5810623168945312, -0.555938720703125, -0.5308151245117188, -0.5056915283203125, -0.48056793212890625, -0.4554443359375, -0.43032073974609375, -0.4051971435546875, -0.38007354736328125, -0.354949951171875, -0.32982635498046875, -0.3047027587890625, -0.27957916259765625, -0.25445556640625, -0.22933197021484375, -0.2042083740234375, -0.17908477783203125, -0.153961181640625, -0.12883758544921875, -0.1037139892578125, -0.07859039306640625, -0.053466796875, -0.02834320068359375, -0.0032196044921875, 0.02190399169921875, 0.047027587890625, 0.07215118408203125, 0.0972747802734375, 0.12239837646484375, 0.14752197265625, 0.17264556884765625, 0.1977691650390625, 0.22289276123046875, 0.248016357421875, 0.27313995361328125, 0.2982635498046875, 0.32338714599609375, 0.3485107421875, 0.37363433837890625, 0.3987579345703125, 0.42388153076171875, 0.449005126953125, 0.47412872314453125, 0.4992523193359375, 0.5243759155273438, 0.54949951171875, 0.5746231079101562, 0.5997467041015625, 0.6248703002929688, 0.649993896484375, 0.6751174926757812, 0.7002410888671875, 0.7253646850585938, 0.75048828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 6.0, 5.0, 18.0, 27.0, 30.0, 34.0, 44.0, 67.0, 65.0, 86.0, 84.0, 104.0, 76.0, 87.0, 70.0, 37.0, 46.0, 31.0, 33.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-05, -1.7677433788776398e-05, -1.68774276971817e-05, -1.6077421605587006e-05, -1.527741551399231e-05, -1.4477409422397614e-05, -1.3677403330802917e-05, -1.2877397239208221e-05, -1.2077391147613525e-05, -1.127738505601883e-05, -1.0477378964424133e-05, -9.677372872829437e-06, -8.877366781234741e-06, -8.077360689640045e-06, -7.277354598045349e-06, -6.477348506450653e-06, -5.677342414855957e-06, -4.877336323261261e-06, -4.077330231666565e-06, -3.277324140071869e-06, -2.477318048477173e-06, -1.6773119568824768e-06, -8.773058652877808e-07, -7.729977369308472e-08, 7.227063179016113e-07, 1.5227124094963074e-06, 2.3227185010910034e-06, 3.1227245926856995e-06, 3.9227306842803955e-06, 4.7227367758750916e-06, 5.522742867469788e-06, 6.322748959064484e-06, 7.12275505065918e-06, 7.922761142253876e-06, 8.722767233848572e-06, 9.522773325443268e-06, 1.0322779417037964e-05, 1.112278550863266e-05, 1.1922791600227356e-05, 1.2722797691822052e-05, 1.3522803783416748e-05, 1.4322809875011444e-05, 1.512281596660614e-05, 1.5922822058200836e-05, 1.6722828149795532e-05, 1.7522834241390228e-05, 1.8322840332984924e-05, 1.912284642457962e-05, 1.9922852516174316e-05, 2.0722858607769012e-05, 2.152286469936371e-05, 2.2322870790958405e-05, 2.31228768825531e-05, 2.3922882974147797e-05, 2.4722889065742493e-05, 2.552289515733719e-05, 2.6322901248931885e-05, 2.712290734052658e-05, 2.7922913432121277e-05, 2.8722919523715973e-05, 2.952292561531067e-05, 3.0322931706905365e-05, 3.112293779850006e-05, 3.192294389009476e-05, 3.272294998168945e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 19.0, 22.0, 24.0, 35.0, 59.0, 77.0, 113.0, 175.0, 242.0, 436.0, 710.0, 1199.0, 1907.0, 3267.0, 5658.0, 9552.0, 16944.0, 29261.0, 52663.0, 97722.0, 187496.0, 263144.0, 172489.0, 91162.0, 48913.0, 27415.0, 15647.0, 8944.0, 5313.0, 3167.0, 1844.0, 1114.0, 669.0, 406.0, 267.0, 156.0, 105.0, 61.0, 44.0, 40.0, 16.0, 18.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6142578125, -0.5940780639648438, -0.5738983154296875, -0.5537185668945312, -0.533538818359375, -0.5133590698242188, -0.4931793212890625, -0.47299957275390625, -0.45281982421875, -0.43264007568359375, -0.4124603271484375, -0.39228057861328125, -0.372100830078125, -0.35192108154296875, -0.3317413330078125, -0.31156158447265625, -0.2913818359375, -0.27120208740234375, -0.2510223388671875, -0.23084259033203125, -0.210662841796875, -0.19048309326171875, -0.1703033447265625, -0.15012359619140625, -0.12994384765625, -0.10976409912109375, -0.0895843505859375, -0.06940460205078125, -0.049224853515625, -0.02904510498046875, -0.0088653564453125, 0.01131439208984375, 0.031494140625, 0.05167388916015625, 0.0718536376953125, 0.09203338623046875, 0.112213134765625, 0.13239288330078125, 0.1525726318359375, 0.17275238037109375, 0.19293212890625, 0.21311187744140625, 0.2332916259765625, 0.25347137451171875, 0.273651123046875, 0.29383087158203125, 0.3140106201171875, 0.33419036865234375, 0.3543701171875, 0.37454986572265625, 0.3947296142578125, 0.41490936279296875, 0.435089111328125, 0.45526885986328125, 0.4754486083984375, 0.49562835693359375, 0.51580810546875, 0.5359878540039062, 0.5561676025390625, 0.5763473510742188, 0.596527099609375, 0.6167068481445312, 0.6368865966796875, 0.6570663452148438, 0.67724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 4.0, 7.0, 10.0, 9.0, 11.0, 7.0, 14.0, 17.0, 19.0, 20.0, 34.0, 24.0, 35.0, 41.0, 41.0, 55.0, 61.0, 52.0, 60.0, 55.0, 56.0, 60.0, 63.0, 31.0, 25.0, 32.0, 26.0, 25.0, 10.0, 19.0, 12.0, 12.0, 9.0, 13.0, 6.0, 7.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.29296875, -0.2825736999511719, -0.27217864990234375, -0.2617835998535156, -0.2513885498046875, -0.24099349975585938, -0.23059844970703125, -0.22020339965820312, -0.209808349609375, -0.19941329956054688, -0.18901824951171875, -0.17862319946289062, -0.1682281494140625, -0.15783309936523438, -0.14743804931640625, -0.13704299926757812, -0.12664794921875, -0.11625289916992188, -0.10585784912109375, -0.09546279907226562, -0.0850677490234375, -0.07467269897460938, -0.06427764892578125, -0.053882598876953125, -0.043487548828125, -0.033092498779296875, -0.02269744873046875, -0.012302398681640625, -0.0019073486328125, 0.008487701416015625, 0.01888275146484375, 0.029277801513671875, 0.0396728515625, 0.050067901611328125, 0.06046295166015625, 0.07085800170898438, 0.0812530517578125, 0.09164810180664062, 0.10204315185546875, 0.11243820190429688, 0.122833251953125, 0.13322830200195312, 0.14362335205078125, 0.15401840209960938, 0.1644134521484375, 0.17480850219726562, 0.18520355224609375, 0.19559860229492188, 0.20599365234375, 0.21638870239257812, 0.22678375244140625, 0.23717880249023438, 0.2475738525390625, 0.2579689025878906, 0.26836395263671875, 0.2787590026855469, 0.289154052734375, 0.2995491027832031, 0.30994415283203125, 0.3203392028808594, 0.3307342529296875, 0.3411293029785156, 0.35152435302734375, 0.3619194030761719, 0.372314453125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 9.0, 8.0, 16.0, 14.0, 6.0, 13.0, 21.0, 23.0, 33.0, 31.0, 32.0, 29.0, 45.0, 47.0, 46.0, 54.0, 44.0, 51.0, 41.0, 38.0, 47.0, 44.0, 29.0, 51.0, 39.0, 29.0, 33.0, 20.0, 26.0, 14.0, 7.0, 9.0, 8.0, 4.0, 9.0, 2.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.28689956665039, -8.044787406921387, -7.802674293518066, -7.5605621337890625, -7.3184494972229, -7.076336860656738, -6.834224700927734, -6.592112064361572, -6.34999942779541, -6.107886791229248, -5.865774154663086, -5.623661994934082, -5.38154935836792, -5.139436721801758, -4.897324562072754, -4.655211925506592, -4.41309928894043, -4.170986652374268, -3.9288742542266846, -3.6867618560791016, -3.4446492195129395, -3.2025365829467773, -2.9604241847991943, -2.7183117866516113, -2.476199150085449, -2.234086513519287, -1.991974115371704, -1.7498615980148315, -1.507749080657959, -1.2656365633010864, -1.0235240459442139, -0.7814115285873413, -0.5392990112304688, -0.2971864938735962, -0.05507397651672363, 0.18703854084014893, 0.4291510581970215, 0.671263575553894, 0.9133760929107666, 1.1554886102676392, 1.3976011276245117, 1.6397136449813843, 1.8818261623382568, 2.12393856048584, 2.366051197052002, 2.608163833618164, 2.850276231765747, 3.09238862991333, 3.334501266479492, 3.5766139030456543, 3.8187263011932373, 4.06083869934082, 4.302951335906982, 4.5450639724731445, 4.787176132202148, 5.0292887687683105, 5.271401405334473, 5.513514041900635, 5.755626678466797, 5.997738838195801, 6.239851474761963, 6.481964111328125, 6.724076271057129, 6.966188907623291, 7.208301544189453]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 9.0, 10.0, 15.0, 14.0, 17.0, 28.0, 32.0, 25.0, 28.0, 33.0, 35.0, 31.0, 25.0, 38.0, 34.0, 41.0, 43.0, 47.0, 37.0, 32.0, 50.0, 39.0, 20.0, 26.0, 41.0, 28.0, 41.0, 28.0, 18.0, 16.0, 19.0, 11.0, 13.0, 15.0, 9.0, 11.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.911843776702881, -7.651417255401611, -7.390990734100342, -7.130564212799072, -6.870138168334961, -6.609711647033691, -6.349285125732422, -6.088858604431152, -5.828432083129883, -5.568005561828613, -5.307579040527344, -5.047152519226074, -4.786725997924805, -4.526299476623535, -4.265873432159424, -4.005446910858154, -3.7450203895568848, -3.4845938682556152, -3.2241673469543457, -2.9637410640716553, -2.7033145427703857, -2.442888021469116, -2.182461738586426, -1.9220352172851562, -1.6616086959838867, -1.4011821746826172, -1.1407557725906372, -0.8803293108940125, -0.6199028491973877, -0.35947632789611816, -0.09904992580413818, 0.1613764762878418, 0.42180347442626953, 0.6822299361228943, 0.942656397819519, 1.203082799911499, 1.4635093212127686, 1.723935842514038, 1.984362244606018, 2.244788646697998, 2.5052151679992676, 2.765641689300537, 3.0260682106018066, 3.286494493484497, 3.5469210147857666, 3.807347536087036, 4.067773818969727, 4.328200340270996, 4.588626861572266, 4.849053382873535, 5.109479904174805, 5.369906425476074, 5.630332946777344, 5.890759468078613, 6.151185512542725, 6.411612033843994, 6.672038555145264, 6.932465076446533, 7.192891597747803, 7.453318119049072, 7.713744163513184, 7.974170684814453, 8.234597206115723, 8.495023727416992, 8.755450248718262]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 17.0, 21.0, 20.0, 42.0, 46.0, 78.0, 117.0, 161.0, 270.0, 377.0, 592.0, 888.0, 1313.0, 2007.0, 3015.0, 4736.0, 7151.0, 10875.0, 16255.0, 24611.0, 36684.0, 53369.0, 73847.0, 96407.0, 114978.0, 123342.0, 117598.0, 101476.0, 79312.0, 58102.0, 40322.0, 27090.0, 18241.0, 11871.0, 8228.0, 5121.0, 3389.0, 2218.0, 1490.0, 943.0, 629.0, 405.0, 282.0, 192.0, 145.0, 86.0, 59.0, 46.0, 35.0, 13.0, 14.0, 4.0, 7.0, 7.0, 2.0, 0.0, 3.0, 2.0], "bins": [-5.5703125, -5.3941650390625, -5.218017578125, -5.0418701171875, -4.86572265625, -4.6895751953125, -4.513427734375, -4.3372802734375, -4.1611328125, -3.9849853515625, -3.808837890625, -3.6326904296875, -3.45654296875, -3.2803955078125, -3.104248046875, -2.9281005859375, -2.751953125, -2.5758056640625, -2.399658203125, -2.2235107421875, -2.04736328125, -1.8712158203125, -1.695068359375, -1.5189208984375, -1.3427734375, -1.1666259765625, -0.990478515625, -0.8143310546875, -0.63818359375, -0.4620361328125, -0.285888671875, -0.1097412109375, 0.06640625, 0.2425537109375, 0.418701171875, 0.5948486328125, 0.77099609375, 0.9471435546875, 1.123291015625, 1.2994384765625, 1.4755859375, 1.6517333984375, 1.827880859375, 2.0040283203125, 2.18017578125, 2.3563232421875, 2.532470703125, 2.7086181640625, 2.884765625, 3.0609130859375, 3.237060546875, 3.4132080078125, 3.58935546875, 3.7655029296875, 3.941650390625, 4.1177978515625, 4.2939453125, 4.4700927734375, 4.646240234375, 4.8223876953125, 4.99853515625, 5.1746826171875, 5.350830078125, 5.5269775390625, 5.703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 6.0, 12.0, 7.0, 15.0, 16.0, 18.0, 29.0, 33.0, 30.0, 32.0, 24.0, 36.0, 36.0, 29.0, 44.0, 44.0, 31.0, 42.0, 48.0, 38.0, 45.0, 32.0, 38.0, 36.0, 38.0, 40.0, 21.0, 30.0, 29.0, 20.0, 18.0, 15.0, 14.0, 8.0, 5.0, 7.0, 9.0, 12.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5611572265625, -8.302001953125, -8.0428466796875, -7.78369140625, -7.5245361328125, -7.265380859375, -7.0062255859375, -6.7470703125, -6.4879150390625, -6.228759765625, -5.9696044921875, -5.71044921875, -5.4512939453125, -5.192138671875, -4.9329833984375, -4.673828125, -4.4146728515625, -4.155517578125, -3.8963623046875, -3.63720703125, -3.3780517578125, -3.118896484375, -2.8597412109375, -2.6005859375, -2.3414306640625, -2.082275390625, -1.8231201171875, -1.56396484375, -1.3048095703125, -1.045654296875, -0.7864990234375, -0.52734375, -0.2681884765625, -0.009033203125, 0.2501220703125, 0.50927734375, 0.7684326171875, 1.027587890625, 1.2867431640625, 1.5458984375, 1.8050537109375, 2.064208984375, 2.3233642578125, 2.58251953125, 2.8416748046875, 3.100830078125, 3.3599853515625, 3.619140625, 3.8782958984375, 4.137451171875, 4.3966064453125, 4.65576171875, 4.9149169921875, 5.174072265625, 5.4332275390625, 5.6923828125, 5.9515380859375, 6.210693359375, 6.4698486328125, 6.72900390625, 6.9881591796875, 7.247314453125, 7.5064697265625, 7.765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 12.0, 11.0, 24.0, 39.0, 46.0, 76.0, 101.0, 123.0, 230.0, 370.0, 545.0, 997.0, 1580.0, 2622.0, 4391.0, 7403.0, 12581.0, 21607.0, 35855.0, 57803.0, 88674.0, 123963.0, 150744.0, 153864.0, 130128.0, 94928.0, 63148.0, 39163.0, 23408.0, 13670.0, 8167.0, 4800.0, 2810.0, 1705.0, 1123.0, 686.0, 432.0, 255.0, 167.0, 99.0, 62.0, 63.0, 29.0, 17.0, 16.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4453125, -8.19757080078125, -7.9498291015625, -7.70208740234375, -7.454345703125, -7.20660400390625, -6.9588623046875, -6.71112060546875, -6.46337890625, -6.21563720703125, -5.9678955078125, -5.72015380859375, -5.472412109375, -5.22467041015625, -4.9769287109375, -4.72918701171875, -4.4814453125, -4.23370361328125, -3.9859619140625, -3.73822021484375, -3.490478515625, -3.24273681640625, -2.9949951171875, -2.74725341796875, -2.49951171875, -2.25177001953125, -2.0040283203125, -1.75628662109375, -1.508544921875, -1.26080322265625, -1.0130615234375, -0.76531982421875, -0.517578125, -0.26983642578125, -0.0220947265625, 0.22564697265625, 0.473388671875, 0.72113037109375, 0.9688720703125, 1.21661376953125, 1.46435546875, 1.71209716796875, 1.9598388671875, 2.20758056640625, 2.455322265625, 2.70306396484375, 2.9508056640625, 3.19854736328125, 3.4462890625, 3.69403076171875, 3.9417724609375, 4.18951416015625, 4.437255859375, 4.68499755859375, 4.9327392578125, 5.18048095703125, 5.42822265625, 5.67596435546875, 5.9237060546875, 6.17144775390625, 6.419189453125, 6.66693115234375, 6.9146728515625, 7.16241455078125, 7.41015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 1.0, 6.0, 1.0, 4.0, 9.0, 7.0, 11.0, 10.0, 13.0, 15.0, 14.0, 19.0, 26.0, 25.0, 31.0, 32.0, 34.0, 37.0, 41.0, 41.0, 52.0, 38.0, 42.0, 52.0, 43.0, 40.0, 36.0, 28.0, 26.0, 31.0, 36.0, 26.0, 21.0, 23.0, 18.0, 22.0, 13.0, 8.0, 7.0, 12.0, 10.0, 13.0, 10.0, 6.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.8046875, -4.638427734375, -4.47216796875, -4.305908203125, -4.1396484375, -3.973388671875, -3.80712890625, -3.640869140625, -3.474609375, -3.308349609375, -3.14208984375, -2.975830078125, -2.8095703125, -2.643310546875, -2.47705078125, -2.310791015625, -2.14453125, -1.978271484375, -1.81201171875, -1.645751953125, -1.4794921875, -1.313232421875, -1.14697265625, -0.980712890625, -0.814453125, -0.648193359375, -0.48193359375, -0.315673828125, -0.1494140625, 0.016845703125, 0.18310546875, 0.349365234375, 0.515625, 0.681884765625, 0.84814453125, 1.014404296875, 1.1806640625, 1.346923828125, 1.51318359375, 1.679443359375, 1.845703125, 2.011962890625, 2.17822265625, 2.344482421875, 2.5107421875, 2.677001953125, 2.84326171875, 3.009521484375, 3.17578125, 3.342041015625, 3.50830078125, 3.674560546875, 3.8408203125, 4.007080078125, 4.17333984375, 4.339599609375, 4.505859375, 4.672119140625, 4.83837890625, 5.004638671875, 5.1708984375, 5.337158203125, 5.50341796875, 5.669677734375, 5.8359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 7.0, 12.0, 12.0, 20.0, 42.0, 63.0, 88.0, 137.0, 201.0, 295.0, 493.0, 834.0, 1343.0, 2284.0, 4229.0, 8644.0, 18983.0, 44819.0, 102743.0, 197753.0, 259940.0, 206504.0, 110354.0, 48404.0, 20425.0, 9174.0, 4518.0, 2441.0, 1415.0, 836.0, 518.0, 364.0, 232.0, 146.0, 106.0, 54.0, 47.0, 26.0, 16.0, 18.0, 12.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.3629150390625, -5.175048828125, -4.9871826171875, -4.79931640625, -4.6114501953125, -4.423583984375, -4.2357177734375, -4.0478515625, -3.8599853515625, -3.672119140625, -3.4842529296875, -3.29638671875, -3.1085205078125, -2.920654296875, -2.7327880859375, -2.544921875, -2.3570556640625, -2.169189453125, -1.9813232421875, -1.79345703125, -1.6055908203125, -1.417724609375, -1.2298583984375, -1.0419921875, -0.8541259765625, -0.666259765625, -0.4783935546875, -0.29052734375, -0.1026611328125, 0.085205078125, 0.2730712890625, 0.4609375, 0.6488037109375, 0.836669921875, 1.0245361328125, 1.21240234375, 1.4002685546875, 1.588134765625, 1.7760009765625, 1.9638671875, 2.1517333984375, 2.339599609375, 2.5274658203125, 2.71533203125, 2.9031982421875, 3.091064453125, 3.2789306640625, 3.466796875, 3.6546630859375, 3.842529296875, 4.0303955078125, 4.21826171875, 4.4061279296875, 4.593994140625, 4.7818603515625, 4.9697265625, 5.1575927734375, 5.345458984375, 5.5333251953125, 5.72119140625, 5.9090576171875, 6.096923828125, 6.2847900390625, 6.47265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 5.0, 4.0, 8.0, 11.0, 28.0, 23.0, 44.0, 53.0, 74.0, 81.0, 106.0, 107.0, 110.0, 94.0, 101.0, 54.0, 30.0, 18.0, 22.0, 9.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000545501708984375, -0.0005222409963607788, -0.0004989802837371826, -0.0004757195711135864, -0.00045245885848999023, -0.00042919814586639404, -0.00040593743324279785, -0.00038267672061920166, -0.00035941600799560547, -0.0003361552953720093, -0.0003128945827484131, -0.0002896338701248169, -0.0002663731575012207, -0.0002431124448776245, -0.00021985173225402832, -0.00019659101963043213, -0.00017333030700683594, -0.00015006959438323975, -0.00012680888175964355, -0.00010354816913604736, -8.028745651245117e-05, -5.702674388885498e-05, -3.376603126525879e-05, -1.0505318641662598e-05, 1.2755393981933594e-05, 3.6016106605529785e-05, 5.9276819229125977e-05, 8.253753185272217e-05, 0.00010579824447631836, 0.00012905895709991455, 0.00015231966972351074, 0.00017558038234710693, 0.00019884109497070312, 0.00022210180759429932, 0.0002453625202178955, 0.0002686232328414917, 0.0002918839454650879, 0.0003151446580886841, 0.0003384053707122803, 0.00036166608333587646, 0.00038492679595947266, 0.00040818750858306885, 0.00043144822120666504, 0.00045470893383026123, 0.0004779696464538574, 0.0005012303590774536, 0.0005244910717010498, 0.000547751784324646, 0.0005710124969482422, 0.0005942732095718384, 0.0006175339221954346, 0.0006407946348190308, 0.000664055347442627, 0.0006873160600662231, 0.0007105767726898193, 0.0007338374853134155, 0.0007570981979370117, 0.0007803589105606079, 0.0008036196231842041, 0.0008268803358078003, 0.0008501410484313965, 0.0008734017610549927, 0.0008966624736785889, 0.0009199231863021851, 0.0009431838989257812]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 13.0, 21.0, 20.0, 31.0, 43.0, 57.0, 100.0, 130.0, 207.0, 384.0, 605.0, 863.0, 1461.0, 2466.0, 4571.0, 9039.0, 19875.0, 47866.0, 112181.0, 214690.0, 268953.0, 194192.0, 95825.0, 40065.0, 17102.0, 7866.0, 4040.0, 2203.0, 1369.0, 855.0, 493.0, 329.0, 192.0, 147.0, 106.0, 50.0, 41.0, 20.0, 22.0, 13.0, 11.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.515625, -6.320556640625, -6.12548828125, -5.930419921875, -5.7353515625, -5.540283203125, -5.34521484375, -5.150146484375, -4.955078125, -4.760009765625, -4.56494140625, -4.369873046875, -4.1748046875, -3.979736328125, -3.78466796875, -3.589599609375, -3.39453125, -3.199462890625, -3.00439453125, -2.809326171875, -2.6142578125, -2.419189453125, -2.22412109375, -2.029052734375, -1.833984375, -1.638916015625, -1.44384765625, -1.248779296875, -1.0537109375, -0.858642578125, -0.66357421875, -0.468505859375, -0.2734375, -0.078369140625, 0.11669921875, 0.311767578125, 0.5068359375, 0.701904296875, 0.89697265625, 1.092041015625, 1.287109375, 1.482177734375, 1.67724609375, 1.872314453125, 2.0673828125, 2.262451171875, 2.45751953125, 2.652587890625, 2.84765625, 3.042724609375, 3.23779296875, 3.432861328125, 3.6279296875, 3.822998046875, 4.01806640625, 4.213134765625, 4.408203125, 4.603271484375, 4.79833984375, 4.993408203125, 5.1884765625, 5.383544921875, 5.57861328125, 5.773681640625, 5.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 12.0, 9.0, 18.0, 28.0, 38.0, 48.0, 59.0, 75.0, 66.0, 79.0, 86.0, 82.0, 75.0, 54.0, 70.0, 48.0, 27.0, 22.0, 23.0, 26.0, 15.0, 10.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.830078125, -1.7685546875, -1.70703125, -1.6455078125, -1.583984375, -1.5224609375, -1.4609375, -1.3994140625, -1.337890625, -1.2763671875, -1.21484375, -1.1533203125, -1.091796875, -1.0302734375, -0.96875, -0.9072265625, -0.845703125, -0.7841796875, -0.72265625, -0.6611328125, -0.599609375, -0.5380859375, -0.4765625, -0.4150390625, -0.353515625, -0.2919921875, -0.23046875, -0.1689453125, -0.107421875, -0.0458984375, 0.015625, 0.0771484375, 0.138671875, 0.2001953125, 0.26171875, 0.3232421875, 0.384765625, 0.4462890625, 0.5078125, 0.5693359375, 0.630859375, 0.6923828125, 0.75390625, 0.8154296875, 0.876953125, 0.9384765625, 1.0, 1.0615234375, 1.123046875, 1.1845703125, 1.24609375, 1.3076171875, 1.369140625, 1.4306640625, 1.4921875, 1.5537109375, 1.615234375, 1.6767578125, 1.73828125, 1.7998046875, 1.861328125, 1.9228515625, 1.984375, 2.0458984375, 2.107421875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 7.0, 0.0, 1.0, 5.0, 3.0, 9.0, 10.0, 15.0, 12.0, 15.0, 19.0, 23.0, 29.0, 36.0, 41.0, 39.0, 36.0, 43.0, 47.0, 48.0, 60.0, 64.0, 52.0, 65.0, 47.0, 29.0, 25.0, 43.0, 40.0, 34.0, 18.0, 19.0, 16.0, 15.0, 8.0, 9.0, 7.0, 3.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.115504264831543, -9.833325386047363, -9.551146507263184, -9.268966674804688, -8.986787796020508, -8.704608917236328, -8.422430038452148, -8.140251159667969, -7.858072280883789, -7.575893402099609, -7.2937140464782715, -7.011535167694092, -6.729356288909912, -6.447176933288574, -6.1649980545043945, -5.882819175720215, -5.600639820098877, -5.318460941314697, -5.036281585693359, -4.75410270690918, -4.471923828125, -4.18974494934082, -3.9075655937194824, -3.6253867149353027, -3.343207597732544, -3.061028480529785, -2.7788496017456055, -2.4966704845428467, -2.214491367340088, -1.9323124885559082, -1.6501333713531494, -1.3679543733596802, -1.0857748985290527, -0.8035959005355835, -0.5214168429374695, -0.23923778533935547, 0.04294121265411377, 0.325120210647583, 0.6072993278503418, 0.889478325843811, 1.1716573238372803, 1.4538363218307495, 1.7360153198242188, 2.0181944370269775, 2.3003735542297363, 2.582552433013916, 2.864731550216675, 3.1469106674194336, 3.4290895462036133, 3.711268663406372, 3.9934475421905518, 4.2756266593933105, 4.55780553817749, 4.839984893798828, 5.122163772583008, 5.4043426513671875, 5.686521530151367, 5.968700408935547, 6.250879764556885, 6.5330586433410645, 6.815237522125244, 7.097416877746582, 7.379595756530762, 7.661774635314941, 7.943953990936279]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 5.0, 11.0, 9.0, 7.0, 19.0, 11.0, 18.0, 14.0, 20.0, 25.0, 29.0, 26.0, 33.0, 40.0, 40.0, 41.0, 49.0, 48.0, 33.0, 42.0, 51.0, 32.0, 43.0, 33.0, 34.0, 39.0, 24.0, 30.0, 24.0, 16.0, 24.0, 26.0, 20.0, 11.0, 16.0, 7.0, 7.0, 6.0, 4.0, 7.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-10.622222900390625, -10.303954124450684, -9.985684394836426, -9.667415618896484, -9.349146842956543, -9.030878067016602, -8.712608337402344, -8.394339561462402, -8.076070785522461, -7.757801532745361, -7.43953275680542, -7.12126350402832, -6.802994728088379, -6.484725475311279, -6.16645622253418, -5.848187446594238, -5.5299177169799805, -5.211648464202881, -4.8933796882629395, -4.57511043548584, -4.256841659545898, -3.938572406768799, -3.620303153991699, -3.3020341396331787, -2.983765125274658, -2.6654961109161377, -2.347227096557617, -2.0289578437805176, -1.710688829421997, -1.3924198150634766, -1.0741506814956665, -0.7558815479278564, -0.43761157989501953, -0.11934250593185425, 0.19892656803131104, 0.5171956419944763, 0.8354647159576416, 1.153733730316162, 1.4720028638839722, 1.7902719974517822, 2.1085410118103027, 2.4268100261688232, 2.7450790405273438, 3.0633482933044434, 3.381617307662964, 3.6998863220214844, 4.018155574798584, 4.336424827575684, 4.654693603515625, 4.972962856292725, 5.291231632232666, 5.609500885009766, 5.927769660949707, 6.246038913726807, 6.564308166503906, 6.882576942443848, 7.200846195220947, 7.519115447998047, 7.837384223937988, 8.15565299987793, 8.473922729492188, 8.792191505432129, 9.11046028137207, 9.428730010986328, 9.74699878692627]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 11.0, 5.0, 7.0, 11.0, 18.0, 19.0, 20.0, 29.0, 38.0, 50.0, 72.0, 134.0, 212.0, 331.0, 556.0, 829.0, 1384.0, 2474.0, 5028.0, 16539.0, 1011331.0, 5206.0, 2516.0, 1397.0, 860.0, 545.0, 304.0, 207.0, 142.0, 95.0, 66.0, 33.0, 23.0, 18.0, 19.0, 14.0, 10.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-131.32412719726562, -126.94771575927734, -122.5713119506836, -118.19490051269531, -113.81849670410156, -109.44208526611328, -105.065673828125, -100.68927001953125, -96.3128662109375, -91.93645477294922, -87.56005096435547, -83.18363952636719, -78.80723571777344, -74.43082427978516, -70.05441284179688, -65.67800903320312, -61.301597595214844, -56.92518997192383, -52.54878234863281, -48.17237091064453, -43.79596710205078, -39.4195556640625, -35.043148040771484, -30.66674041748047, -26.290332794189453, -21.913925170898438, -17.537517547607422, -13.161108016967773, -8.784700393676758, -4.408292770385742, -0.03188323974609375, 4.344524383544922, 8.720932006835938, 13.097339630126953, 17.47374725341797, 21.850156784057617, 26.226564407348633, 30.60297203063965, 34.9793815612793, 39.35578918457031, 43.73219680786133, 48.108604431152344, 52.48501205444336, 56.861419677734375, 61.237831115722656, 65.6142349243164, 69.99064636230469, 74.36705017089844, 78.74346160888672, 83.119873046875, 87.49627685546875, 91.87268829345703, 96.24909210205078, 100.62550354003906, 105.00190734863281, 109.3783187866211, 113.75473022460938, 118.13114166259766, 122.5075454711914, 126.88395690917969, 131.26036071777344, 135.6367645263672, 140.01318359375, 144.38958740234375, 148.7659912109375]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 13.0, 9.0, 12.0, 18.0, 16.0, 37.0, 50.0, 67.0, 116.0, 153.0, 248.0, 463.0, 719.0, 1208.0, 1888.0, 2974.0, 4782.0, 8096.0, 21343.0, 51366200.0, 38539.0, 9941.0, 5233.0, 3467.0, 2145.0, 1351.0, 839.0, 504.0, 301.0, 192.0, 123.0, 92.0, 51.0, 43.0, 36.0, 18.0, 9.0, 14.0, 13.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.14997100830078, -109.19941711425781, -105.24885559082031, -101.29830169677734, -97.34774780273438, -93.39718627929688, -89.4466323852539, -85.49607849121094, -81.54551696777344, -77.59496307373047, -73.64440155029297, -69.69384765625, -65.7432861328125, -61.79273223876953, -57.84217834472656, -53.89162063598633, -49.941062927246094, -45.99050521850586, -42.039947509765625, -38.089393615722656, -34.13883590698242, -30.188278198242188, -26.237722396850586, -22.287166595458984, -18.33660888671875, -14.386052131652832, -10.435495376586914, -6.484938621520996, -2.534381866455078, 1.4161758422851562, 5.366731643676758, 9.31728744506836, 13.267837524414062, 17.218395233154297, 21.1689510345459, 25.1195068359375, 29.070064544677734, 33.02062225341797, 36.97117614746094, 40.92173385620117, 44.872291564941406, 48.82284927368164, 52.773406982421875, 56.723960876464844, 60.67451858520508, 64.62507629394531, 68.57563018798828, 72.52618408203125, 76.47674560546875, 80.42729949951172, 84.37786102294922, 88.32841491699219, 92.27897644042969, 96.22953033447266, 100.18008422851562, 104.13064575195312, 108.0811996459961, 112.03175354003906, 115.98231506347656, 119.93286895751953, 123.8834228515625, 127.833984375, 131.7845458984375, 135.73509216308594, 139.68565368652344]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 3.0, 13.0, 14.0, 18.0, 19.0, 28.0, 31.0, 25.0, 50.0, 71.0, 55.0, 72.0, 68.0, 77.0, 56.0, 69.0, 68.0, 46.0, 40.0, 27.0, 31.0, 9.0, 15.0, 14.0, 12.0, 13.0, 8.0, 6.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-130.62277221679688, -126.44393920898438, -122.26510620117188, -118.08627319335938, -113.90743255615234, -109.72859954833984, -105.54976654052734, -101.37093353271484, -97.19209289550781, -93.01325988769531, -88.83442687988281, -84.65559387207031, -80.47675323486328, -76.29792022705078, -72.11908721923828, -67.94025421142578, -63.76142120361328, -59.58258819580078, -55.403751373291016, -51.224918365478516, -47.04608154296875, -42.86724853515625, -38.68841552734375, -34.50958251953125, -30.330745697021484, -26.15191078186035, -21.97307586669922, -17.79424285888672, -13.615407943725586, -9.436573028564453, -5.257740020751953, -1.0789051055908203, 3.0999298095703125, 7.278764247894287, 11.457598686218262, 15.636432647705078, 19.81526756286621, 23.994102478027344, 28.172935485839844, 32.351768493652344, 36.53060531616211, 40.70943832397461, 44.888275146484375, 49.067108154296875, 53.245941162109375, 57.42477798461914, 61.60361099243164, 65.7824478149414, 69.9612808227539, 74.1401138305664, 78.3189468383789, 82.49778747558594, 86.67662048339844, 90.85545349121094, 95.03428649902344, 99.21311950683594, 103.39195251464844, 107.57078552246094, 111.74961853027344, 115.92845153808594, 120.10729217529297, 124.28612518310547, 128.4649658203125, 132.643798828125, 136.8226318359375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 11.0, 8.0, 12.0, 13.0, 14.0, 14.0, 29.0, 19.0, 26.0, 30.0, 37.0, 37.0, 53.0, 55.0, 57.0, 71.0, 64.0, 52.0, 49.0, 43.0, 34.0, 37.0, 28.0, 27.0, 22.0, 21.0, 23.0, 13.0, 11.0, 17.0, 14.0, 8.0, 4.0, 2.0, 5.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.7757110595703, -140.26004028320312, -135.74435424804688, -131.2286834716797, -126.71299743652344, -122.19732666015625, -117.68164825439453, -113.16596984863281, -108.6502914428711, -104.13461303710938, -99.61893463134766, -95.10325622558594, -90.58758544921875, -86.0718994140625, -81.55622863769531, -77.0405502319336, -72.52487182617188, -68.00919342041016, -63.49351501464844, -58.977840423583984, -54.462162017822266, -49.94648361206055, -45.430809020996094, -40.915130615234375, -36.399452209472656, -31.883773803710938, -27.36809730529785, -22.852420806884766, -18.336742401123047, -13.821063995361328, -9.305387496948242, -4.789710998535156, -0.2740478515625, 4.241629600524902, 8.757307052612305, 13.272984504699707, 17.78866195678711, 22.304340362548828, 26.820016860961914, 31.335693359375, 35.85137176513672, 40.36705017089844, 44.882728576660156, 49.39840316772461, 53.91408157348633, 58.42975997924805, 62.9454345703125, 67.46111297607422, 71.97679138183594, 76.49246978759766, 81.00814819335938, 85.5238265991211, 90.03950500488281, 94.55517578125, 99.07085418701172, 103.58653259277344, 108.10221099853516, 112.61788940429688, 117.1335678100586, 121.64924621582031, 126.1649169921875, 130.68060302734375, 135.19627380371094, 139.71194458007812, 144.22763061523438]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 15.0, 22.0, 16.0, 32.0, 71.0, 92.0, 140.0, 257.0, 419.0, 659.0, 1108.0, 1924.0, 3391.0, 6147.0, 11855.0, 24531.0, 55762.0, 143592.0, 417088.0, 1674789.0, 1274088.0, 363072.0, 123912.0, 47740.0, 20563.0, 10091.0, 5250.0, 2989.0, 1684.0, 1104.0, 658.0, 402.0, 277.0, 178.0, 107.0, 81.0, 54.0, 36.0, 32.0, 11.0, 8.0, 6.0, 10.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.33984375, -2.264190673828125, -2.18853759765625, -2.112884521484375, -2.0372314453125, -1.961578369140625, -1.88592529296875, -1.810272216796875, -1.734619140625, -1.658966064453125, -1.58331298828125, -1.507659912109375, -1.4320068359375, -1.356353759765625, -1.28070068359375, -1.205047607421875, -1.12939453125, -1.053741455078125, -0.97808837890625, -0.902435302734375, -0.8267822265625, -0.751129150390625, -0.67547607421875, -0.599822998046875, -0.524169921875, -0.448516845703125, -0.37286376953125, -0.297210693359375, -0.2215576171875, -0.145904541015625, -0.07025146484375, 0.005401611328125, 0.0810546875, 0.156707763671875, 0.23236083984375, 0.308013916015625, 0.3836669921875, 0.459320068359375, 0.53497314453125, 0.610626220703125, 0.686279296875, 0.761932373046875, 0.83758544921875, 0.913238525390625, 0.9888916015625, 1.064544677734375, 1.14019775390625, 1.215850830078125, 1.29150390625, 1.367156982421875, 1.44281005859375, 1.518463134765625, 1.5941162109375, 1.669769287109375, 1.74542236328125, 1.821075439453125, 1.896728515625, 1.972381591796875, 2.04803466796875, 2.123687744140625, 2.1993408203125, 2.274993896484375, 2.35064697265625, 2.426300048828125, 2.501953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 5.0, 14.0, 11.0, 13.0, 31.0, 29.0, 53.0, 50.0, 85.0, 67.0, 71.0, 82.0, 90.0, 70.0, 73.0, 70.0, 57.0, 28.0, 25.0, 16.0, 14.0, 14.0, 4.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2809257507324219, -0.27108001708984375, -0.2612342834472656, -0.2513885498046875, -0.24154281616210938, -0.23169708251953125, -0.22185134887695312, -0.212005615234375, -0.20215988159179688, -0.19231414794921875, -0.18246841430664062, -0.1726226806640625, -0.16277694702148438, -0.15293121337890625, -0.14308547973632812, -0.13323974609375, -0.12339401245117188, -0.11354827880859375, -0.10370254516601562, -0.0938568115234375, -0.08401107788085938, -0.07416534423828125, -0.06431961059570312, -0.054473876953125, -0.044628143310546875, -0.03478240966796875, -0.024936676025390625, -0.0150909423828125, -0.005245208740234375, 0.00460052490234375, 0.014446258544921875, 0.0242919921875, 0.034137725830078125, 0.04398345947265625, 0.053829193115234375, 0.0636749267578125, 0.07352066040039062, 0.08336639404296875, 0.09321212768554688, 0.103057861328125, 0.11290359497070312, 0.12274932861328125, 0.13259506225585938, 0.1424407958984375, 0.15228652954101562, 0.16213226318359375, 0.17197799682617188, 0.18182373046875, 0.19166946411132812, 0.20151519775390625, 0.21136093139648438, 0.2212066650390625, 0.23105239868164062, 0.24089813232421875, 0.2507438659667969, 0.260589599609375, 0.2704353332519531, 0.28028106689453125, 0.2901268005371094, 0.2999725341796875, 0.3098182678222656, 0.31966400146484375, 0.3295097351074219, 0.33935546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 17.0, 15.0, 25.0, 29.0, 56.0, 90.0, 132.0, 235.0, 348.0, 567.0, 927.0, 1479.0, 2594.0, 4429.0, 8135.0, 15102.0, 29275.0, 60968.0, 135390.0, 324810.0, 859988.0, 1607601.0, 665498.0, 259202.0, 111285.0, 50569.0, 25183.0, 13259.0, 7179.0, 3948.0, 2392.0, 1428.0, 780.0, 507.0, 307.0, 175.0, 126.0, 70.0, 48.0, 40.0, 22.0, 13.0, 10.0, 8.0, 8.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.724090576171875, -1.67083740234375, -1.617584228515625, -1.5643310546875, -1.511077880859375, -1.45782470703125, -1.404571533203125, -1.351318359375, -1.298065185546875, -1.24481201171875, -1.191558837890625, -1.1383056640625, -1.085052490234375, -1.03179931640625, -0.978546142578125, -0.92529296875, -0.872039794921875, -0.81878662109375, -0.765533447265625, -0.7122802734375, -0.659027099609375, -0.60577392578125, -0.552520751953125, -0.499267578125, -0.446014404296875, -0.39276123046875, -0.339508056640625, -0.2862548828125, -0.233001708984375, -0.17974853515625, -0.126495361328125, -0.0732421875, -0.019989013671875, 0.03326416015625, 0.086517333984375, 0.1397705078125, 0.193023681640625, 0.24627685546875, 0.299530029296875, 0.352783203125, 0.406036376953125, 0.45928955078125, 0.512542724609375, 0.5657958984375, 0.619049072265625, 0.67230224609375, 0.725555419921875, 0.77880859375, 0.832061767578125, 0.88531494140625, 0.938568115234375, 0.9918212890625, 1.045074462890625, 1.09832763671875, 1.151580810546875, 1.204833984375, 1.258087158203125, 1.31134033203125, 1.364593505859375, 1.4178466796875, 1.471099853515625, 1.52435302734375, 1.577606201171875, 1.630859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 13.0, 13.0, 26.0, 30.0, 31.0, 36.0, 60.0, 59.0, 77.0, 86.0, 141.0, 163.0, 187.0, 230.0, 284.0, 306.0, 417.0, 319.0, 245.0, 234.0, 192.0, 169.0, 141.0, 106.0, 81.0, 64.0, 59.0, 60.0, 48.0, 36.0, 31.0, 29.0, 19.0, 11.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.475830078125, -0.4586982727050781, -0.44156646728515625, -0.4244346618652344, -0.4073028564453125, -0.3901710510253906, -0.37303924560546875, -0.3559074401855469, -0.338775634765625, -0.3216438293457031, -0.30451202392578125, -0.2873802185058594, -0.2702484130859375, -0.2531166076660156, -0.23598480224609375, -0.21885299682617188, -0.20172119140625, -0.18458938598632812, -0.16745758056640625, -0.15032577514648438, -0.1331939697265625, -0.11606216430664062, -0.09893035888671875, -0.08179855346679688, -0.064666748046875, -0.047534942626953125, -0.03040313720703125, -0.013271331787109375, 0.0038604736328125, 0.020992279052734375, 0.03812408447265625, 0.055255889892578125, 0.0723876953125, 0.08951950073242188, 0.10665130615234375, 0.12378311157226562, 0.1409149169921875, 0.15804672241210938, 0.17517852783203125, 0.19231033325195312, 0.209442138671875, 0.22657394409179688, 0.24370574951171875, 0.2608375549316406, 0.2779693603515625, 0.2951011657714844, 0.31223297119140625, 0.3293647766113281, 0.34649658203125, 0.3636283874511719, 0.38076019287109375, 0.3978919982910156, 0.4150238037109375, 0.4321556091308594, 0.44928741455078125, 0.4664192199707031, 0.483551025390625, 0.5006828308105469, 0.5178146362304688, 0.5349464416503906, 0.5520782470703125, 0.5692100524902344, 0.5863418579101562, 0.6034736633300781, 0.62060546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 14.0, 43.0, 127.0, 242.0, 263.0, 165.0, 77.0, 45.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09284210205078, -18.481613159179688, -17.870384216308594, -17.2591552734375, -16.647926330566406, -16.036697387695312, -15.425467491149902, -14.814237594604492, -14.203008651733398, -13.591779708862305, -12.980550765991211, -12.369321823120117, -11.758091926574707, -11.146862983703613, -10.53563404083252, -9.92440414428711, -9.313176155090332, -8.701947212219238, -8.090718269348145, -7.479488849639893, -6.868259429931641, -6.257030487060547, -5.645801544189453, -5.034572124481201, -4.423343181610107, -3.8121140003204346, -3.2008848190307617, -2.589655876159668, -1.9784266948699951, -1.3671975135803223, -0.7559685707092285, -0.14473915100097656, 0.4664897918701172, 1.07771897315979, 1.6889480352401733, 2.3001770973205566, 2.9114062786102295, 3.5226354598999023, 4.133864402770996, 4.745093822479248, 5.356322765350342, 5.9675517082214355, 6.5787811279296875, 7.190010070800781, 7.801239013671875, 8.412467956542969, 9.023696899414062, 9.634926795959473, 10.246155738830566, 10.85738468170166, 11.468613624572754, 12.079843521118164, 12.691072463989258, 13.302301406860352, 13.913530349731445, 14.524759292602539, 15.135988235473633, 15.747217178344727, 16.35844612121582, 16.969675064086914, 17.580904006958008, 18.192134857177734, 18.803363800048828, 19.414592742919922, 20.025821685791016]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 8.0, 6.0, 6.0, 6.0, 10.0, 11.0, 16.0, 17.0, 18.0, 36.0, 19.0, 30.0, 33.0, 35.0, 35.0, 33.0, 48.0, 44.0, 36.0, 36.0, 39.0, 41.0, 37.0, 41.0, 46.0, 45.0, 43.0, 27.0, 26.0, 27.0, 19.0, 17.0, 25.0, 22.0, 10.0, 10.0, 6.0, 10.0, 11.0, 5.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.173708915710449, -3.0636112689971924, -2.9535136222839355, -2.843416213989258, -2.733318567276001, -2.623220920562744, -2.5131232738494873, -2.4030256271362305, -2.2929279804229736, -2.182830333709717, -2.07273268699646, -1.9626351594924927, -1.8525375127792358, -1.7424399852752686, -1.6323423385620117, -1.5222446918487549, -1.4121471643447876, -1.3020495176315308, -1.1919519901275635, -1.0818543434143066, -0.9717566967010498, -0.8616591095924377, -0.7515615224838257, -0.6414638757705688, -0.5313662886619568, -0.42126867175102234, -0.3111710548400879, -0.20107346773147583, -0.09097585082054138, 0.019121766090393066, 0.12921935319900513, 0.23931699991226196, 0.349414587020874, 0.45951220393180847, 0.5696098208427429, 0.679707407951355, 0.7898050546646118, 0.8999026417732239, 1.010000228881836, 1.1200978755950928, 1.2301955223083496, 1.3402931690216064, 1.4503906965255737, 1.5604883432388306, 1.6705859899520874, 1.7806835174560547, 1.8907811641693115, 2.0008788108825684, 2.110976219177246, 2.221073865890503, 2.3311715126037598, 2.4412689208984375, 2.5513665676116943, 2.661464214324951, 2.771561861038208, 2.881659507751465, 2.9917571544647217, 3.1018548011779785, 3.2119524478912354, 3.322050094604492, 3.43214750289917, 3.5422451496124268, 3.6523427963256836, 3.7624404430389404, 3.8725380897521973]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 7.0, 8.0, 7.0, 14.0, 16.0, 17.0, 24.0, 37.0, 48.0, 69.0, 106.0, 149.0, 192.0, 338.0, 521.0, 793.0, 1355.0, 2347.0, 4177.0, 7772.0, 15920.0, 33862.0, 77291.0, 176422.0, 300265.0, 230434.0, 106573.0, 45892.0, 21028.0, 10283.0, 5198.0, 2817.0, 1701.0, 1009.0, 628.0, 393.0, 276.0, 179.0, 123.0, 95.0, 48.0, 37.0, 26.0, 17.0, 14.0, 8.0, 7.0, 2.0, 10.0, 6.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.990234375, -0.955718994140625, -0.92120361328125, -0.886688232421875, -0.8521728515625, -0.817657470703125, -0.78314208984375, -0.748626708984375, -0.714111328125, -0.679595947265625, -0.64508056640625, -0.610565185546875, -0.5760498046875, -0.541534423828125, -0.50701904296875, -0.472503662109375, -0.43798828125, -0.403472900390625, -0.36895751953125, -0.334442138671875, -0.2999267578125, -0.265411376953125, -0.23089599609375, -0.196380615234375, -0.161865234375, -0.127349853515625, -0.09283447265625, -0.058319091796875, -0.0238037109375, 0.010711669921875, 0.04522705078125, 0.079742431640625, 0.1142578125, 0.148773193359375, 0.18328857421875, 0.217803955078125, 0.2523193359375, 0.286834716796875, 0.32135009765625, 0.355865478515625, 0.390380859375, 0.424896240234375, 0.45941162109375, 0.493927001953125, 0.5284423828125, 0.562957763671875, 0.59747314453125, 0.631988525390625, 0.66650390625, 0.701019287109375, 0.73553466796875, 0.770050048828125, 0.8045654296875, 0.839080810546875, 0.87359619140625, 0.908111572265625, 0.942626953125, 0.977142333984375, 1.01165771484375, 1.046173095703125, 1.0806884765625, 1.115203857421875, 1.14971923828125, 1.184234619140625, 1.21875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 11.0, 3.0, 8.0, 17.0, 13.0, 25.0, 33.0, 31.0, 43.0, 53.0, 58.0, 69.0, 62.0, 70.0, 61.0, 58.0, 65.0, 57.0, 49.0, 38.0, 43.0, 25.0, 21.0, 13.0, 19.0, 14.0, 5.0, 8.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.292724609375, -0.28383636474609375, -0.2749481201171875, -0.26605987548828125, -0.257171630859375, -0.24828338623046875, -0.2393951416015625, -0.23050689697265625, -0.22161865234375, -0.21273040771484375, -0.2038421630859375, -0.19495391845703125, -0.186065673828125, -0.17717742919921875, -0.1682891845703125, -0.15940093994140625, -0.1505126953125, -0.14162445068359375, -0.1327362060546875, -0.12384796142578125, -0.114959716796875, -0.10607147216796875, -0.0971832275390625, -0.08829498291015625, -0.07940673828125, -0.07051849365234375, -0.0616302490234375, -0.05274200439453125, -0.043853759765625, -0.03496551513671875, -0.0260772705078125, -0.01718902587890625, -0.00830078125, 0.00058746337890625, 0.0094757080078125, 0.01836395263671875, 0.027252197265625, 0.03614044189453125, 0.0450286865234375, 0.05391693115234375, 0.06280517578125, 0.07169342041015625, 0.0805816650390625, 0.08946990966796875, 0.098358154296875, 0.10724639892578125, 0.1161346435546875, 0.12502288818359375, 0.1339111328125, 0.14279937744140625, 0.1516876220703125, 0.16057586669921875, 0.169464111328125, 0.17835235595703125, 0.1872406005859375, 0.19612884521484375, 0.20501708984375, 0.21390533447265625, 0.2227935791015625, 0.23168182373046875, 0.240570068359375, 0.24945831298828125, 0.2583465576171875, 0.26723480224609375, 0.276123046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 10.0, 15.0, 16.0, 43.0, 75.0, 181.0, 381.0, 929.0, 2474.0, 7183.0, 27341.0, 165612.0, 665785.0, 143346.0, 24659.0, 6666.0, 2295.0, 841.0, 362.0, 149.0, 70.0, 45.0, 16.0, 13.0, 8.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.140625, -3.04949951171875, -2.9583740234375, -2.86724853515625, -2.776123046875, -2.68499755859375, -2.5938720703125, -2.50274658203125, -2.41162109375, -2.32049560546875, -2.2293701171875, -2.13824462890625, -2.047119140625, -1.95599365234375, -1.8648681640625, -1.77374267578125, -1.6826171875, -1.59149169921875, -1.5003662109375, -1.40924072265625, -1.318115234375, -1.22698974609375, -1.1358642578125, -1.04473876953125, -0.95361328125, -0.86248779296875, -0.7713623046875, -0.68023681640625, -0.589111328125, -0.49798583984375, -0.4068603515625, -0.31573486328125, -0.224609375, -0.13348388671875, -0.0423583984375, 0.04876708984375, 0.139892578125, 0.23101806640625, 0.3221435546875, 0.41326904296875, 0.50439453125, 0.59552001953125, 0.6866455078125, 0.77777099609375, 0.868896484375, 0.96002197265625, 1.0511474609375, 1.14227294921875, 1.2333984375, 1.32452392578125, 1.4156494140625, 1.50677490234375, 1.597900390625, 1.68902587890625, 1.7801513671875, 1.87127685546875, 1.96240234375, 2.05352783203125, 2.1446533203125, 2.23577880859375, 2.326904296875, 2.41802978515625, 2.5091552734375, 2.60028076171875, 2.69140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 8.0, 9.0, 5.0, 7.0, 14.0, 14.0, 23.0, 13.0, 24.0, 28.0, 28.0, 30.0, 39.0, 36.0, 47.0, 49.0, 55.0, 52.0, 37.0, 48.0, 41.0, 40.0, 34.0, 44.0, 36.0, 32.0, 29.0, 26.0, 26.0, 23.0, 28.0, 15.0, 14.0, 9.0, 10.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.49609375, -1.44732666015625, -1.3985595703125, -1.34979248046875, -1.301025390625, -1.25225830078125, -1.2034912109375, -1.15472412109375, -1.10595703125, -1.05718994140625, -1.0084228515625, -0.95965576171875, -0.910888671875, -0.86212158203125, -0.8133544921875, -0.76458740234375, -0.7158203125, -0.66705322265625, -0.6182861328125, -0.56951904296875, -0.520751953125, -0.47198486328125, -0.4232177734375, -0.37445068359375, -0.32568359375, -0.27691650390625, -0.2281494140625, -0.17938232421875, -0.130615234375, -0.08184814453125, -0.0330810546875, 0.01568603515625, 0.064453125, 0.11322021484375, 0.1619873046875, 0.21075439453125, 0.259521484375, 0.30828857421875, 0.3570556640625, 0.40582275390625, 0.45458984375, 0.50335693359375, 0.5521240234375, 0.60089111328125, 0.649658203125, 0.69842529296875, 0.7471923828125, 0.79595947265625, 0.8447265625, 0.89349365234375, 0.9422607421875, 0.99102783203125, 1.039794921875, 1.08856201171875, 1.1373291015625, 1.18609619140625, 1.23486328125, 1.28363037109375, 1.3323974609375, 1.38116455078125, 1.429931640625, 1.47869873046875, 1.5274658203125, 1.57623291015625, 1.625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 18.0, 16.0, 16.0, 42.0, 79.0, 120.0, 223.0, 502.0, 1279.0, 4349.0, 32491.0, 935417.0, 65171.0, 6177.0, 1515.0, 569.0, 241.0, 134.0, 77.0, 40.0, 23.0, 10.0, 12.0, 11.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.78125, -13.414794921875, -13.04833984375, -12.681884765625, -12.3154296875, -11.948974609375, -11.58251953125, -11.216064453125, -10.849609375, -10.483154296875, -10.11669921875, -9.750244140625, -9.3837890625, -9.017333984375, -8.65087890625, -8.284423828125, -7.91796875, -7.551513671875, -7.18505859375, -6.818603515625, -6.4521484375, -6.085693359375, -5.71923828125, -5.352783203125, -4.986328125, -4.619873046875, -4.25341796875, -3.886962890625, -3.5205078125, -3.154052734375, -2.78759765625, -2.421142578125, -2.0546875, -1.688232421875, -1.32177734375, -0.955322265625, -0.5888671875, -0.222412109375, 0.14404296875, 0.510498046875, 0.876953125, 1.243408203125, 1.60986328125, 1.976318359375, 2.3427734375, 2.709228515625, 3.07568359375, 3.442138671875, 3.80859375, 4.175048828125, 4.54150390625, 4.907958984375, 5.2744140625, 5.640869140625, 6.00732421875, 6.373779296875, 6.740234375, 7.106689453125, 7.47314453125, 7.839599609375, 8.2060546875, 8.572509765625, 8.93896484375, 9.305419921875, 9.671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 22.0, 33.0, 36.0, 69.0, 85.0, 114.0, 120.0, 121.0, 98.0, 80.0, 62.0, 44.0, 28.0, 28.0, 5.0, 13.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002532005310058594, -0.0002441592514514923, -0.00023511797189712524, -0.00022607669234275818, -0.0002170354127883911, -0.00020799413323402405, -0.00019895285367965698, -0.00018991157412528992, -0.00018087029457092285, -0.00017182901501655579, -0.00016278773546218872, -0.00015374645590782166, -0.0001447051763534546, -0.00013566389679908752, -0.00012662261724472046, -0.0001175813376903534, -0.00010854005813598633, -9.949877858161926e-05, -9.04574990272522e-05, -8.141621947288513e-05, -7.237493991851807e-05, -6.3333660364151e-05, -5.4292380809783936e-05, -4.525110125541687e-05, -3.6209821701049805e-05, -2.716854214668274e-05, -1.8127262592315674e-05, -9.085983037948608e-06, -4.470348358154297e-08, 8.996576070785522e-06, 1.8037855625152588e-05, 2.7079135179519653e-05, 3.612041473388672e-05, 4.5161694288253784e-05, 5.420297384262085e-05, 6.324425339698792e-05, 7.228553295135498e-05, 8.132681250572205e-05, 9.036809206008911e-05, 9.940937161445618e-05, 0.00010845065116882324, 0.00011749193072319031, 0.00012653321027755737, 0.00013557448983192444, 0.0001446157693862915, 0.00015365704894065857, 0.00016269832849502563, 0.0001717396080493927, 0.00018078088760375977, 0.00018982216715812683, 0.0001988634467124939, 0.00020790472626686096, 0.00021694600582122803, 0.0002259872853755951, 0.00023502856492996216, 0.00024406984448432922, 0.0002531111240386963, 0.00026215240359306335, 0.0002711936831474304, 0.0002802349627017975, 0.00028927624225616455, 0.0002983175218105316, 0.0003073588013648987, 0.00031640008091926575, 0.0003254413604736328]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 12.0, 16.0, 25.0, 44.0, 64.0, 117.0, 181.0, 266.0, 430.0, 752.0, 1374.0, 2664.0, 5917.0, 14957.0, 55251.0, 632500.0, 278318.0, 35016.0, 11124.0, 4613.0, 2140.0, 1117.0, 657.0, 373.0, 226.0, 156.0, 88.0, 48.0, 37.0, 20.0, 17.0, 13.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.04296875, -5.86956787109375, -5.6961669921875, -5.52276611328125, -5.349365234375, -5.17596435546875, -5.0025634765625, -4.82916259765625, -4.65576171875, -4.48236083984375, -4.3089599609375, -4.13555908203125, -3.962158203125, -3.78875732421875, -3.6153564453125, -3.44195556640625, -3.2685546875, -3.09515380859375, -2.9217529296875, -2.74835205078125, -2.574951171875, -2.40155029296875, -2.2281494140625, -2.05474853515625, -1.88134765625, -1.70794677734375, -1.5345458984375, -1.36114501953125, -1.187744140625, -1.01434326171875, -0.8409423828125, -0.66754150390625, -0.494140625, -0.32073974609375, -0.1473388671875, 0.02606201171875, 0.199462890625, 0.37286376953125, 0.5462646484375, 0.71966552734375, 0.89306640625, 1.06646728515625, 1.2398681640625, 1.41326904296875, 1.586669921875, 1.76007080078125, 1.9334716796875, 2.10687255859375, 2.2802734375, 2.45367431640625, 2.6270751953125, 2.80047607421875, 2.973876953125, 3.14727783203125, 3.3206787109375, 3.49407958984375, 3.66748046875, 3.84088134765625, 4.0142822265625, 4.18768310546875, 4.361083984375, 4.53448486328125, 4.7078857421875, 4.88128662109375, 5.0546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 6.0, 9.0, 16.0, 10.0, 11.0, 17.0, 30.0, 38.0, 34.0, 75.0, 89.0, 77.0, 118.0, 105.0, 85.0, 75.0, 50.0, 33.0, 32.0, 23.0, 10.0, 8.0, 9.0, 13.0, 9.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1875, -2.1181640625, -2.048828125, -1.9794921875, -1.91015625, -1.8408203125, -1.771484375, -1.7021484375, -1.6328125, -1.5634765625, -1.494140625, -1.4248046875, -1.35546875, -1.2861328125, -1.216796875, -1.1474609375, -1.078125, -1.0087890625, -0.939453125, -0.8701171875, -0.80078125, -0.7314453125, -0.662109375, -0.5927734375, -0.5234375, -0.4541015625, -0.384765625, -0.3154296875, -0.24609375, -0.1767578125, -0.107421875, -0.0380859375, 0.03125, 0.1005859375, 0.169921875, 0.2392578125, 0.30859375, 0.3779296875, 0.447265625, 0.5166015625, 0.5859375, 0.6552734375, 0.724609375, 0.7939453125, 0.86328125, 0.9326171875, 1.001953125, 1.0712890625, 1.140625, 1.2099609375, 1.279296875, 1.3486328125, 1.41796875, 1.4873046875, 1.556640625, 1.6259765625, 1.6953125, 1.7646484375, 1.833984375, 1.9033203125, 1.97265625, 2.0419921875, 2.111328125, 2.1806640625, 2.25]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 15.0, 18.0, 28.0, 57.0, 122.0, 174.0, 223.0, 174.0, 90.0, 46.0, 21.0, 13.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.267791748046875, -30.20023536682129, -29.13267707824707, -28.065120697021484, -26.997562408447266, -25.93000602722168, -24.862449645996094, -23.794891357421875, -22.727333068847656, -21.65977668762207, -20.59221839904785, -19.524662017822266, -18.457103729248047, -17.38954734802246, -16.321990966796875, -15.254432678222656, -14.18687629699707, -13.119318962097168, -12.051761627197266, -10.98420524597168, -9.916646957397461, -8.849090576171875, -7.781533241271973, -6.71397590637207, -5.646418571472168, -4.578861236572266, -3.5113041400909424, -2.443747043609619, -1.3761897087097168, -0.30863237380981445, 0.7589244842529297, 1.826481819152832, 2.8940391540527344, 3.9615964889526367, 5.029153823852539, 6.096710681915283, 7.1642680168151855, 8.23182487487793, 9.299382209777832, 10.366939544677734, 11.434496879577637, 12.502054214477539, 13.569611549377441, 14.637168884277344, 15.70472526550293, 16.77228355407715, 17.839839935302734, 18.907398223876953, 19.97495460510254, 21.042510986328125, 22.110069274902344, 23.17762565612793, 24.24518394470215, 25.312740325927734, 26.380298614501953, 27.44785499572754, 28.515411376953125, 29.58296775817871, 30.65052604675293, 31.718082427978516, 32.785640716552734, 33.85319900512695, 34.920753479003906, 35.988311767578125, 37.055870056152344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 12.0, 17.0, 24.0, 25.0, 50.0, 86.0, 91.0, 93.0, 94.0, 107.0, 96.0, 85.0, 47.0, 37.0, 26.0, 10.0, 12.0, 12.0, 10.0, 7.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.50630760192871, -19.790912628173828, -19.075519561767578, -18.360124588012695, -17.644731521606445, -16.929336547851562, -16.213943481445312, -15.49854850769043, -14.783154487609863, -14.067760467529297, -13.35236644744873, -12.636972427368164, -11.921577453613281, -11.206184387207031, -10.490789413452148, -9.775395393371582, -9.060001373291016, -8.34460735321045, -7.629213333129883, -6.913818836212158, -6.198424816131592, -5.483030796051025, -4.767636299133301, -4.052242279052734, -3.336848258972168, -2.6214542388916016, -1.906059980392456, -1.1906657218933105, -0.47527170181274414, 0.24012231826782227, 0.9555168151855469, 1.6709108352661133, 2.3863048553466797, 3.101698875427246, 3.8170931339263916, 4.532487392425537, 5.2478814125061035, 5.96327543258667, 6.6786699295043945, 7.394063949584961, 8.109457969665527, 8.824851989746094, 9.54024600982666, 10.255640029907227, 10.97103500366211, 11.68642807006836, 12.401823043823242, 13.117217063903809, 13.832611083984375, 14.548005104064941, 15.263399124145508, 15.97879409790039, 16.69418716430664, 17.409582138061523, 18.124977111816406, 18.840370178222656, 19.555763244628906, 20.27115821838379, 20.98655128479004, 21.701946258544922, 22.417339324951172, 23.132734298706055, 23.848129272460938, 24.563522338867188, 25.27891731262207]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 4.0, 16.0, 22.0, 25.0, 57.0, 78.0, 116.0, 204.0, 337.0, 536.0, 932.0, 1784.0, 3532.0, 7374.0, 17486.0, 46305.0, 151086.0, 1174617.0, 2519289.0, 181008.0, 53114.0, 19495.0, 8201.0, 3830.0, 2011.0, 1077.0, 632.0, 392.0, 244.0, 137.0, 100.0, 76.0, 32.0, 31.0, 31.0, 15.0, 8.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.716217041015625, -3.57891845703125, -3.441619873046875, -3.3043212890625, -3.167022705078125, -3.02972412109375, -2.892425537109375, -2.755126953125, -2.617828369140625, -2.48052978515625, -2.343231201171875, -2.2059326171875, -2.068634033203125, -1.93133544921875, -1.794036865234375, -1.65673828125, -1.519439697265625, -1.38214111328125, -1.244842529296875, -1.1075439453125, -0.970245361328125, -0.83294677734375, -0.695648193359375, -0.558349609375, -0.421051025390625, -0.28375244140625, -0.146453857421875, -0.0091552734375, 0.128143310546875, 0.26544189453125, 0.402740478515625, 0.5400390625, 0.677337646484375, 0.81463623046875, 0.951934814453125, 1.0892333984375, 1.226531982421875, 1.36383056640625, 1.501129150390625, 1.638427734375, 1.775726318359375, 1.91302490234375, 2.050323486328125, 2.1876220703125, 2.324920654296875, 2.46221923828125, 2.599517822265625, 2.73681640625, 2.874114990234375, 3.01141357421875, 3.148712158203125, 3.2860107421875, 3.423309326171875, 3.56060791015625, 3.697906494140625, 3.835205078125, 3.972503662109375, 4.10980224609375, 4.247100830078125, 4.3843994140625, 4.521697998046875, 4.65899658203125, 4.796295166015625, 4.93359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 3.0, 9.0, 7.0, 10.0, 14.0, 14.0, 22.0, 24.0, 39.0, 45.0, 40.0, 41.0, 52.0, 53.0, 62.0, 62.0, 55.0, 53.0, 58.0, 49.0, 61.0, 37.0, 39.0, 29.0, 22.0, 23.0, 14.0, 14.0, 7.0, 7.0, 5.0, 4.0, 5.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.2315540313720703, -0.22323989868164062, -0.21492576599121094, -0.20661163330078125, -0.19829750061035156, -0.18998336791992188, -0.1816692352294922, -0.1733551025390625, -0.1650409698486328, -0.15672683715820312, -0.14841270446777344, -0.14009857177734375, -0.13178443908691406, -0.12347030639648438, -0.11515617370605469, -0.106842041015625, -0.09852790832519531, -0.09021377563476562, -0.08189964294433594, -0.07358551025390625, -0.06527137756347656, -0.056957244873046875, -0.04864311218261719, -0.0403289794921875, -0.03201484680175781, -0.023700714111328125, -0.015386581420898438, -0.00707244873046875, 0.0012416839599609375, 0.009555816650390625, 0.017869949340820312, 0.02618408203125, 0.03449821472167969, 0.042812347412109375, 0.05112648010253906, 0.05944061279296875, 0.06775474548339844, 0.07606887817382812, 0.08438301086425781, 0.0926971435546875, 0.10101127624511719, 0.10932540893554688, 0.11763954162597656, 0.12595367431640625, 0.13426780700683594, 0.14258193969726562, 0.1508960723876953, 0.159210205078125, 0.1675243377685547, 0.17583847045898438, 0.18415260314941406, 0.19246673583984375, 0.20078086853027344, 0.20909500122070312, 0.2174091339111328, 0.2257232666015625, 0.2340373992919922, 0.24235153198242188, 0.25066566467285156, 0.25897979736328125, 0.26729393005371094, 0.2756080627441406, 0.2839221954345703, 0.292236328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 7.0, 11.0, 16.0, 18.0, 29.0, 39.0, 76.0, 105.0, 167.0, 279.0, 446.0, 735.0, 1323.0, 2346.0, 4134.0, 8010.0, 17075.0, 39976.0, 110996.0, 463916.0, 2947069.0, 423137.0, 103517.0, 37535.0, 16293.0, 7769.0, 3892.0, 2130.0, 1284.0, 745.0, 434.0, 240.0, 185.0, 116.0, 76.0, 52.0, 36.0, 18.0, 9.0, 11.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.8984375, -3.7705078125, -3.642578125, -3.5146484375, -3.38671875, -3.2587890625, -3.130859375, -3.0029296875, -2.875, -2.7470703125, -2.619140625, -2.4912109375, -2.36328125, -2.2353515625, -2.107421875, -1.9794921875, -1.8515625, -1.7236328125, -1.595703125, -1.4677734375, -1.33984375, -1.2119140625, -1.083984375, -0.9560546875, -0.828125, -0.7001953125, -0.572265625, -0.4443359375, -0.31640625, -0.1884765625, -0.060546875, 0.0673828125, 0.1953125, 0.3232421875, 0.451171875, 0.5791015625, 0.70703125, 0.8349609375, 0.962890625, 1.0908203125, 1.21875, 1.3466796875, 1.474609375, 1.6025390625, 1.73046875, 1.8583984375, 1.986328125, 2.1142578125, 2.2421875, 2.3701171875, 2.498046875, 2.6259765625, 2.75390625, 2.8818359375, 3.009765625, 3.1376953125, 3.265625, 3.3935546875, 3.521484375, 3.6494140625, 3.77734375, 3.9052734375, 4.033203125, 4.1611328125, 4.2890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 6.0, 10.0, 15.0, 12.0, 21.0, 33.0, 45.0, 50.0, 86.0, 106.0, 140.0, 218.0, 406.0, 1282.0, 677.0, 292.0, 212.0, 130.0, 90.0, 58.0, 48.0, 31.0, 24.0, 18.0, 16.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68408203125, -0.6625442504882812, -0.6410064697265625, -0.6194686889648438, -0.597930908203125, -0.5763931274414062, -0.5548553466796875, -0.5333175659179688, -0.51177978515625, -0.49024200439453125, -0.4687042236328125, -0.44716644287109375, -0.425628662109375, -0.40409088134765625, -0.3825531005859375, -0.36101531982421875, -0.3394775390625, -0.31793975830078125, -0.2964019775390625, -0.27486419677734375, -0.253326416015625, -0.23178863525390625, -0.2102508544921875, -0.18871307373046875, -0.16717529296875, -0.14563751220703125, -0.1240997314453125, -0.10256195068359375, -0.081024169921875, -0.05948638916015625, -0.0379486083984375, -0.01641082763671875, 0.005126953125, 0.02666473388671875, 0.0482025146484375, 0.06974029541015625, 0.091278076171875, 0.11281585693359375, 0.1343536376953125, 0.15589141845703125, 0.17742919921875, 0.19896697998046875, 0.2205047607421875, 0.24204254150390625, 0.263580322265625, 0.28511810302734375, 0.3066558837890625, 0.32819366455078125, 0.3497314453125, 0.37126922607421875, 0.3928070068359375, 0.41434478759765625, 0.435882568359375, 0.45742034912109375, 0.4789581298828125, 0.5004959106445312, 0.52203369140625, 0.5435714721679688, 0.5651092529296875, 0.5866470336914062, 0.608184814453125, 0.6297225952148438, 0.6512603759765625, 0.6727981567382812, 0.6943359375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 8.0, 29.0, 167.0, 401.0, 296.0, 72.0, 16.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.709792137145996, -13.154809951782227, -12.599828720092773, -12.044846534729004, -11.48986530303955, -10.934883117675781, -10.379901885986328, -9.824919700622559, -9.269937515258789, -8.71495532989502, -8.159974098205566, -7.604991912841797, -7.050010681152344, -6.495028495788574, -5.940046787261963, -5.385065078735352, -4.830083847045898, -4.275102138519287, -3.720120429992676, -3.1651384830474854, -2.610156774520874, -2.0551750659942627, -1.5001931190490723, -0.9452114105224609, -0.3902297019958496, 0.1647520661354065, 0.7197338342666626, 1.2747156620025635, 1.8296973705291748, 2.384679079055786, 2.9396610260009766, 3.494642734527588, 4.049625396728516, 4.604607105255127, 5.159588813781738, 5.714570999145508, 6.269552230834961, 6.8245344161987305, 7.379516124725342, 7.934497833251953, 8.489479064941406, 9.044461250305176, 9.599442481994629, 10.154424667358398, 10.709405899047852, 11.264388084411621, 11.81937026977539, 12.374351501464844, 12.929333686828613, 13.484315872192383, 14.039297103881836, 14.594279289245605, 15.149260520935059, 15.704242706298828, 16.25922393798828, 16.814205169677734, 17.36918830871582, 17.924169540405273, 18.47915267944336, 19.034133911132812, 19.589115142822266, 20.14409637451172, 20.699079513549805, 21.254060745239258, 21.80904197692871]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 14.0, 15.0, 10.0, 17.0, 19.0, 39.0, 47.0, 49.0, 43.0, 69.0, 70.0, 62.0, 71.0, 63.0, 68.0, 57.0, 50.0, 54.0, 40.0, 31.0, 23.0, 18.0, 10.0, 17.0, 4.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.3601903915405273, -3.2557363510131836, -3.1512820720672607, -3.046828031539917, -2.942373752593994, -2.8379197120666504, -2.7334656715393066, -2.629011631011963, -2.52455735206604, -2.4201033115386963, -2.3156490325927734, -2.2111949920654297, -2.106740951538086, -2.002286672592163, -1.8978326320648193, -1.793378472328186, -1.6889243125915527, -1.5844701528549194, -1.4800159931182861, -1.3755619525909424, -1.271107792854309, -1.1666536331176758, -1.062199592590332, -0.9577454328536987, -0.8532912731170654, -0.7488371133804321, -0.6443830132484436, -0.5399289131164551, -0.4354747533798218, -0.3310205936431885, -0.22656649351119995, -0.12211239337921143, -0.017658233642578125, 0.08679589629173279, 0.1912500262260437, 0.2957041561603546, 0.4001582860946655, 0.5046124458312988, 0.6090665459632874, 0.7135206460952759, 0.8179748058319092, 0.9224289655685425, 1.0268831253051758, 1.1313371658325195, 1.2357913255691528, 1.3402454853057861, 1.4446995258331299, 1.5491536855697632, 1.6536078453063965, 1.7580620050430298, 1.862516164779663, 1.9669702053070068, 2.0714244842529297, 2.1758785247802734, 2.280332565307617, 2.384786605834961, 2.489240884780884, 2.5936949253082275, 2.6981492042541504, 2.802603244781494, 2.907057285308838, 3.0115115642547607, 3.1159656047821045, 3.2204198837280273, 3.324873924255371]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 5.0, 8.0, 13.0, 8.0, 21.0, 35.0, 40.0, 81.0, 112.0, 219.0, 464.0, 872.0, 1978.0, 4720.0, 12617.0, 38275.0, 134927.0, 393339.0, 319915.0, 96235.0, 28276.0, 9429.0, 3722.0, 1683.0, 735.0, 360.0, 176.0, 111.0, 64.0, 32.0, 21.0, 21.0, 10.0, 5.0, 7.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.255859375, -3.1468505859375, -3.037841796875, -2.9288330078125, -2.81982421875, -2.7108154296875, -2.601806640625, -2.4927978515625, -2.3837890625, -2.2747802734375, -2.165771484375, -2.0567626953125, -1.94775390625, -1.8387451171875, -1.729736328125, -1.6207275390625, -1.51171875, -1.4027099609375, -1.293701171875, -1.1846923828125, -1.07568359375, -0.9666748046875, -0.857666015625, -0.7486572265625, -0.6396484375, -0.5306396484375, -0.421630859375, -0.3126220703125, -0.20361328125, -0.0946044921875, 0.014404296875, 0.1234130859375, 0.232421875, 0.3414306640625, 0.450439453125, 0.5594482421875, 0.66845703125, 0.7774658203125, 0.886474609375, 0.9954833984375, 1.1044921875, 1.2135009765625, 1.322509765625, 1.4315185546875, 1.54052734375, 1.6495361328125, 1.758544921875, 1.8675537109375, 1.9765625, 2.0855712890625, 2.194580078125, 2.3035888671875, 2.41259765625, 2.5216064453125, 2.630615234375, 2.7396240234375, 2.8486328125, 2.9576416015625, 3.066650390625, 3.1756591796875, 3.28466796875, 3.3936767578125, 3.502685546875, 3.6116943359375, 3.720703125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 0.0, 5.0, 4.0, 5.0, 3.0, 5.0, 4.0, 11.0, 8.0, 15.0, 29.0, 14.0, 31.0, 33.0, 55.0, 40.0, 50.0, 53.0, 56.0, 57.0, 41.0, 59.0, 66.0, 58.0, 49.0, 39.0, 34.0, 44.0, 32.0, 21.0, 20.0, 12.0, 15.0, 8.0, 10.0, 2.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19413375854492188, -0.18587493896484375, -0.17761611938476562, -0.1693572998046875, -0.16109848022460938, -0.15283966064453125, -0.14458084106445312, -0.136322021484375, -0.12806320190429688, -0.11980438232421875, -0.11154556274414062, -0.1032867431640625, -0.09502792358398438, -0.08676910400390625, -0.07851028442382812, -0.07025146484375, -0.061992645263671875, -0.05373382568359375, -0.045475006103515625, -0.0372161865234375, -0.028957366943359375, -0.02069854736328125, -0.012439727783203125, -0.004180908203125, 0.004077911376953125, 0.01233673095703125, 0.020595550537109375, 0.0288543701171875, 0.037113189697265625, 0.04537200927734375, 0.053630828857421875, 0.0618896484375, 0.07014846801757812, 0.07840728759765625, 0.08666610717773438, 0.0949249267578125, 0.10318374633789062, 0.11144256591796875, 0.11970138549804688, 0.127960205078125, 0.13621902465820312, 0.14447784423828125, 0.15273666381835938, 0.1609954833984375, 0.16925430297851562, 0.17751312255859375, 0.18577194213867188, 0.19403076171875, 0.20228958129882812, 0.21054840087890625, 0.21880722045898438, 0.2270660400390625, 0.23532485961914062, 0.24358367919921875, 0.2518424987792969, 0.260101318359375, 0.2683601379394531, 0.27661895751953125, 0.2848777770996094, 0.2931365966796875, 0.3013954162597656, 0.30965423583984375, 0.3179130554199219, 0.326171875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 10.0, 11.0, 20.0, 29.0, 52.0, 72.0, 115.0, 205.0, 346.0, 643.0, 1229.0, 2502.0, 5468.0, 13390.0, 38489.0, 128083.0, 389280.0, 320741.0, 98052.0, 30163.0, 10880.0, 4446.0, 2022.0, 1002.0, 540.0, 310.0, 185.0, 101.0, 59.0, 35.0, 22.0, 17.0, 12.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.69140625, -2.60955810546875, -2.5277099609375, -2.44586181640625, -2.364013671875, -2.28216552734375, -2.2003173828125, -2.11846923828125, -2.03662109375, -1.95477294921875, -1.8729248046875, -1.79107666015625, -1.709228515625, -1.62738037109375, -1.5455322265625, -1.46368408203125, -1.3818359375, -1.29998779296875, -1.2181396484375, -1.13629150390625, -1.054443359375, -0.97259521484375, -0.8907470703125, -0.80889892578125, -0.72705078125, -0.64520263671875, -0.5633544921875, -0.48150634765625, -0.399658203125, -0.31781005859375, -0.2359619140625, -0.15411376953125, -0.072265625, 0.00958251953125, 0.0914306640625, 0.17327880859375, 0.255126953125, 0.33697509765625, 0.4188232421875, 0.50067138671875, 0.58251953125, 0.66436767578125, 0.7462158203125, 0.82806396484375, 0.909912109375, 0.99176025390625, 1.0736083984375, 1.15545654296875, 1.2373046875, 1.31915283203125, 1.4010009765625, 1.48284912109375, 1.564697265625, 1.64654541015625, 1.7283935546875, 1.81024169921875, 1.89208984375, 1.97393798828125, 2.0557861328125, 2.13763427734375, 2.219482421875, 2.30133056640625, 2.3831787109375, 2.46502685546875, 2.546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 8.0, 6.0, 4.0, 5.0, 7.0, 11.0, 22.0, 11.0, 22.0, 22.0, 13.0, 28.0, 26.0, 33.0, 29.0, 31.0, 38.0, 45.0, 44.0, 44.0, 39.0, 38.0, 56.0, 31.0, 35.0, 41.0, 32.0, 34.0, 34.0, 23.0, 36.0, 24.0, 32.0, 8.0, 19.0, 10.0, 13.0, 8.0, 9.0, 2.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0410308837890625, -1.005889892578125, -0.9707489013671875, -0.93560791015625, -0.9004669189453125, -0.865325927734375, -0.8301849365234375, -0.7950439453125, -0.7599029541015625, -0.724761962890625, -0.6896209716796875, -0.65447998046875, -0.6193389892578125, -0.584197998046875, -0.5490570068359375, -0.513916015625, -0.4787750244140625, -0.443634033203125, -0.4084930419921875, -0.37335205078125, -0.3382110595703125, -0.303070068359375, -0.2679290771484375, -0.2327880859375, -0.1976470947265625, -0.162506103515625, -0.1273651123046875, -0.09222412109375, -0.0570831298828125, -0.021942138671875, 0.0131988525390625, 0.04833984375, 0.0834808349609375, 0.118621826171875, 0.1537628173828125, 0.18890380859375, 0.2240447998046875, 0.259185791015625, 0.2943267822265625, 0.3294677734375, 0.3646087646484375, 0.399749755859375, 0.4348907470703125, 0.47003173828125, 0.5051727294921875, 0.540313720703125, 0.5754547119140625, 0.610595703125, 0.6457366943359375, 0.680877685546875, 0.7160186767578125, 0.75115966796875, 0.7863006591796875, 0.821441650390625, 0.8565826416015625, 0.8917236328125, 0.9268646240234375, 0.962005615234375, 0.9971466064453125, 1.03228759765625, 1.0674285888671875, 1.102569580078125, 1.1377105712890625, 1.1728515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 2.0, 5.0, 11.0, 11.0, 26.0, 38.0, 73.0, 155.0, 294.0, 696.0, 1949.0, 6829.0, 32046.0, 277829.0, 628751.0, 80974.0, 13519.0, 3415.0, 1090.0, 431.0, 192.0, 86.0, 64.0, 29.0, 19.0, 10.0, 11.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.834716796875, -8.63037109375, -8.426025390625, -8.2216796875, -8.017333984375, -7.81298828125, -7.608642578125, -7.404296875, -7.199951171875, -6.99560546875, -6.791259765625, -6.5869140625, -6.382568359375, -6.17822265625, -5.973876953125, -5.76953125, -5.565185546875, -5.36083984375, -5.156494140625, -4.9521484375, -4.747802734375, -4.54345703125, -4.339111328125, -4.134765625, -3.930419921875, -3.72607421875, -3.521728515625, -3.3173828125, -3.113037109375, -2.90869140625, -2.704345703125, -2.5, -2.295654296875, -2.09130859375, -1.886962890625, -1.6826171875, -1.478271484375, -1.27392578125, -1.069580078125, -0.865234375, -0.660888671875, -0.45654296875, -0.252197265625, -0.0478515625, 0.156494140625, 0.36083984375, 0.565185546875, 0.76953125, 0.973876953125, 1.17822265625, 1.382568359375, 1.5869140625, 1.791259765625, 1.99560546875, 2.199951171875, 2.404296875, 2.608642578125, 2.81298828125, 3.017333984375, 3.2216796875, 3.426025390625, 3.63037109375, 3.834716796875, 4.0390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 21.0, 29.0, 33.0, 55.0, 75.0, 124.0, 140.0, 172.0, 118.0, 74.0, 37.0, 28.0, 25.0, 18.0, 14.0, 4.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004305839538574219, -0.00041406601667404175, -0.0003975480794906616, -0.0003810301423072815, -0.00036451220512390137, -0.00034799426794052124, -0.0003314763307571411, -0.000314958393573761, -0.00029844045639038086, -0.00028192251920700073, -0.0002654045820236206, -0.0002488866448402405, -0.00023236870765686035, -0.00021585077047348022, -0.0001993328332901001, -0.00018281489610671997, -0.00016629695892333984, -0.00014977902173995972, -0.0001332610845565796, -0.00011674314737319946, -0.00010022521018981934, -8.370727300643921e-05, -6.718933582305908e-05, -5.0671398639678955e-05, -3.415346145629883e-05, -1.76355242729187e-05, -1.1175870895385742e-06, 1.5400350093841553e-05, 3.191828727722168e-05, 4.843622446060181e-05, 6.495416164398193e-05, 8.147209882736206e-05, 9.799003601074219e-05, 0.00011450797319412231, 0.00013102591037750244, 0.00014754384756088257, 0.0001640617847442627, 0.00018057972192764282, 0.00019709765911102295, 0.00021361559629440308, 0.0002301335334777832, 0.00024665147066116333, 0.00026316940784454346, 0.0002796873450279236, 0.0002962052822113037, 0.00031272321939468384, 0.00032924115657806396, 0.0003457590937614441, 0.0003622770309448242, 0.00037879496812820435, 0.00039531290531158447, 0.0004118308424949646, 0.0004283487796783447, 0.00044486671686172485, 0.000461384654045105, 0.0004779025912284851, 0.0004944205284118652, 0.0005109384655952454, 0.0005274564027786255, 0.0005439743399620056, 0.0005604922771453857, 0.0005770102143287659, 0.000593528151512146, 0.0006100460886955261, 0.0006265640258789062]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 5.0, 10.0, 12.0, 18.0, 29.0, 63.0, 81.0, 113.0, 187.0, 289.0, 467.0, 813.0, 1436.0, 2696.0, 5529.0, 12499.0, 31912.0, 101403.0, 342471.0, 371806.0, 115247.0, 35155.0, 13579.0, 6187.0, 2864.0, 1521.0, 861.0, 466.0, 308.0, 198.0, 123.0, 60.0, 58.0, 32.0, 16.0, 15.0, 12.0, 6.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.103515625, -2.996673583984375, -2.88983154296875, -2.782989501953125, -2.6761474609375, -2.569305419921875, -2.46246337890625, -2.355621337890625, -2.248779296875, -2.141937255859375, -2.03509521484375, -1.928253173828125, -1.8214111328125, -1.714569091796875, -1.60772705078125, -1.500885009765625, -1.39404296875, -1.287200927734375, -1.18035888671875, -1.073516845703125, -0.9666748046875, -0.859832763671875, -0.75299072265625, -0.646148681640625, -0.539306640625, -0.432464599609375, -0.32562255859375, -0.218780517578125, -0.1119384765625, -0.005096435546875, 0.10174560546875, 0.208587646484375, 0.3154296875, 0.422271728515625, 0.52911376953125, 0.635955810546875, 0.7427978515625, 0.849639892578125, 0.95648193359375, 1.063323974609375, 1.170166015625, 1.277008056640625, 1.38385009765625, 1.490692138671875, 1.5975341796875, 1.704376220703125, 1.81121826171875, 1.918060302734375, 2.02490234375, 2.131744384765625, 2.23858642578125, 2.345428466796875, 2.4522705078125, 2.559112548828125, 2.66595458984375, 2.772796630859375, 2.879638671875, 2.986480712890625, 3.09332275390625, 3.200164794921875, 3.3070068359375, 3.413848876953125, 3.52069091796875, 3.627532958984375, 3.734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 5.0, 12.0, 7.0, 11.0, 16.0, 28.0, 37.0, 49.0, 65.0, 71.0, 104.0, 107.0, 91.0, 83.0, 68.0, 65.0, 43.0, 34.0, 33.0, 18.0, 7.0, 9.0, 12.0, 8.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.101531982421875, -2.03118896484375, -1.960845947265625, -1.8905029296875, -1.820159912109375, -1.74981689453125, -1.679473876953125, -1.609130859375, -1.538787841796875, -1.46844482421875, -1.398101806640625, -1.3277587890625, -1.257415771484375, -1.18707275390625, -1.116729736328125, -1.04638671875, -0.976043701171875, -0.90570068359375, -0.835357666015625, -0.7650146484375, -0.694671630859375, -0.62432861328125, -0.553985595703125, -0.483642578125, -0.413299560546875, -0.34295654296875, -0.272613525390625, -0.2022705078125, -0.131927490234375, -0.06158447265625, 0.008758544921875, 0.0791015625, 0.149444580078125, 0.21978759765625, 0.290130615234375, 0.3604736328125, 0.430816650390625, 0.50115966796875, 0.571502685546875, 0.641845703125, 0.712188720703125, 0.78253173828125, 0.852874755859375, 0.9232177734375, 0.993560791015625, 1.06390380859375, 1.134246826171875, 1.20458984375, 1.274932861328125, 1.34527587890625, 1.415618896484375, 1.4859619140625, 1.556304931640625, 1.62664794921875, 1.696990966796875, 1.767333984375, 1.837677001953125, 1.90802001953125, 1.978363037109375, 2.0487060546875, 2.119049072265625, 2.18939208984375, 2.259735107421875, 2.330078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 7.0, 5.0, 8.0, 12.0, 17.0, 40.0, 51.0, 62.0, 114.0, 131.0, 131.0, 126.0, 84.0, 71.0, 48.0, 37.0, 19.0, 9.0, 8.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.410411834716797, -14.842500686645508, -14.274589538574219, -13.70667839050293, -13.13876724243164, -12.570856094360352, -12.002944946289062, -11.435033798217773, -10.867122650146484, -10.299211502075195, -9.731300354003906, -9.163389205932617, -8.595478057861328, -8.027566909790039, -7.459655284881592, -6.891744136810303, -6.3238325119018555, -5.755921363830566, -5.188010215759277, -4.620099067687988, -4.052187919616699, -3.484276533126831, -2.916365146636963, -2.348453998565674, -1.7805428504943848, -1.2126317024230957, -0.6447204351425171, -0.07680916786193848, 0.4911019802093506, 1.0590131282806396, 1.6269245147705078, 2.194835662841797, 2.762746810913086, 3.330657958984375, 3.898569107055664, 4.466480255126953, 5.034391403198242, 5.602302551269531, 6.1702141761779785, 6.738125324249268, 7.306036472320557, 7.873947620391846, 8.441859245300293, 9.009770393371582, 9.577681541442871, 10.14559268951416, 10.71350383758545, 11.281414985656738, 11.849326133728027, 12.417237281799316, 12.985148429870605, 13.553059577941895, 14.120970726013184, 14.688881874084473, 15.256793975830078, 15.824705123901367, 16.392616271972656, 16.960527420043945, 17.528438568115234, 18.096349716186523, 18.664260864257812, 19.2321720123291, 19.80008316040039, 20.36799430847168, 20.93590545654297]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 11.0, 13.0, 8.0, 12.0, 13.0, 14.0, 16.0, 36.0, 38.0, 35.0, 32.0, 48.0, 45.0, 49.0, 68.0, 54.0, 56.0, 61.0, 50.0, 51.0, 50.0, 37.0, 37.0, 30.0, 18.0, 23.0, 18.0, 9.0, 12.0, 7.0, 7.0, 2.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.677696228027344, -9.34708309173584, -9.016470909118652, -8.685857772827148, -8.355244636535645, -8.024632453918457, -7.694019317626953, -7.363406658172607, -7.032793998718262, -6.702181339263916, -6.371568202972412, -6.040955543518066, -5.710342884063721, -5.379730224609375, -5.049117088317871, -4.718504428863525, -4.3878912925720215, -4.057278633117676, -3.726665735244751, -3.396052837371826, -3.0654401779174805, -2.7348272800445557, -2.404214382171631, -2.073601722717285, -1.7429888248443604, -1.412376046180725, -1.0817632675170898, -0.751150369644165, -0.4205375909805298, -0.08992481231689453, 0.24068808555603027, 0.571300745010376, 0.9019136428833008, 1.232526421546936, 1.5631392002105713, 1.893752098083496, 2.224364757537842, 2.5549776554107666, 2.8855905532836914, 3.216203212738037, 3.546816110610962, 3.8774290084838867, 4.208041667938232, 4.538654327392578, 4.869267463684082, 5.199880123138428, 5.530492782592773, 5.861105918884277, 6.191718578338623, 6.522331237792969, 6.852944374084473, 7.183557033538818, 7.514169692993164, 7.844782829284668, 8.175395965576172, 8.50600814819336, 8.836621284484863, 9.167234420776367, 9.497846603393555, 9.828459739685059, 10.159072875976562, 10.48968505859375, 10.820298194885254, 11.150911331176758, 11.481523513793945]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 9.0, 10.0, 19.0, 14.0, 27.0, 52.0, 83.0, 149.0, 227.0, 557.0, 1052.0, 2524.0, 6394.0, 18435.0, 61924.0, 273680.0, 3156107.0, 535841.0, 94216.0, 26899.0, 9211.0, 3540.0, 1537.0, 701.0, 391.0, 214.0, 155.0, 83.0, 68.0, 43.0, 20.0, 28.0, 16.0, 13.0, 10.0, 10.0, 3.0, 5.0, 8.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.0531005859375, -4.856201171875, -4.6593017578125, -4.46240234375, -4.2655029296875, -4.068603515625, -3.8717041015625, -3.6748046875, -3.4779052734375, -3.281005859375, -3.0841064453125, -2.88720703125, -2.6903076171875, -2.493408203125, -2.2965087890625, -2.099609375, -1.9027099609375, -1.705810546875, -1.5089111328125, -1.31201171875, -1.1151123046875, -0.918212890625, -0.7213134765625, -0.5244140625, -0.3275146484375, -0.130615234375, 0.0662841796875, 0.26318359375, 0.4600830078125, 0.656982421875, 0.8538818359375, 1.05078125, 1.2476806640625, 1.444580078125, 1.6414794921875, 1.83837890625, 2.0352783203125, 2.232177734375, 2.4290771484375, 2.6259765625, 2.8228759765625, 3.019775390625, 3.2166748046875, 3.41357421875, 3.6104736328125, 3.807373046875, 4.0042724609375, 4.201171875, 4.3980712890625, 4.594970703125, 4.7918701171875, 4.98876953125, 5.1856689453125, 5.382568359375, 5.5794677734375, 5.7763671875, 5.9732666015625, 6.170166015625, 6.3670654296875, 6.56396484375, 6.7608642578125, 6.957763671875, 7.1546630859375, 7.3515625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 11.0, 7.0, 12.0, 22.0, 25.0, 19.0, 34.0, 58.0, 42.0, 51.0, 54.0, 65.0, 60.0, 71.0, 54.0, 58.0, 60.0, 49.0, 45.0, 45.0, 39.0, 18.0, 22.0, 15.0, 19.0, 11.0, 9.0, 5.0, 3.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.2713050842285156, -0.26209259033203125, -0.2528800964355469, -0.2436676025390625, -0.23445510864257812, -0.22524261474609375, -0.21603012084960938, -0.206817626953125, -0.19760513305664062, -0.18839263916015625, -0.17918014526367188, -0.1699676513671875, -0.16075515747070312, -0.15154266357421875, -0.14233016967773438, -0.13311767578125, -0.12390518188476562, -0.11469268798828125, -0.10548019409179688, -0.0962677001953125, -0.08705520629882812, -0.07784271240234375, -0.06863021850585938, -0.059417724609375, -0.050205230712890625, -0.04099273681640625, -0.031780242919921875, -0.0225677490234375, -0.013355255126953125, -0.00414276123046875, 0.005069732666015625, 0.0142822265625, 0.023494720458984375, 0.03270721435546875, 0.041919708251953125, 0.0511322021484375, 0.060344696044921875, 0.06955718994140625, 0.07876968383789062, 0.087982177734375, 0.09719467163085938, 0.10640716552734375, 0.11561965942382812, 0.1248321533203125, 0.13404464721679688, 0.14325714111328125, 0.15246963500976562, 0.16168212890625, 0.17089462280273438, 0.18010711669921875, 0.18931961059570312, 0.1985321044921875, 0.20774459838867188, 0.21695709228515625, 0.22616958618164062, 0.235382080078125, 0.24459457397460938, 0.25380706787109375, 0.2630195617675781, 0.2722320556640625, 0.2814445495605469, 0.29065704345703125, 0.2998695373535156, 0.30908203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 5.0, 11.0, 10.0, 18.0, 11.0, 14.0, 28.0, 36.0, 47.0, 71.0, 140.0, 353.0, 1069.0, 3242.0, 11533.0, 51032.0, 358622.0, 3299443.0, 395795.0, 55226.0, 12172.0, 3432.0, 1050.0, 409.0, 188.0, 90.0, 51.0, 48.0, 31.0, 17.0, 10.0, 11.0, 9.0, 12.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.90625, -8.64825439453125, -8.3902587890625, -8.13226318359375, -7.874267578125, -7.61627197265625, -7.3582763671875, -7.10028076171875, -6.84228515625, -6.58428955078125, -6.3262939453125, -6.06829833984375, -5.810302734375, -5.55230712890625, -5.2943115234375, -5.03631591796875, -4.7783203125, -4.52032470703125, -4.2623291015625, -4.00433349609375, -3.746337890625, -3.48834228515625, -3.2303466796875, -2.97235107421875, -2.71435546875, -2.45635986328125, -2.1983642578125, -1.94036865234375, -1.682373046875, -1.42437744140625, -1.1663818359375, -0.90838623046875, -0.650390625, -0.39239501953125, -0.1343994140625, 0.12359619140625, 0.381591796875, 0.63958740234375, 0.8975830078125, 1.15557861328125, 1.41357421875, 1.67156982421875, 1.9295654296875, 2.18756103515625, 2.445556640625, 2.70355224609375, 2.9615478515625, 3.21954345703125, 3.4775390625, 3.73553466796875, 3.9935302734375, 4.25152587890625, 4.509521484375, 4.76751708984375, 5.0255126953125, 5.28350830078125, 5.54150390625, 5.79949951171875, 6.0574951171875, 6.31549072265625, 6.573486328125, 6.83148193359375, 7.0894775390625, 7.34747314453125, 7.60546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 9.0, 7.0, 11.0, 9.0, 16.0, 24.0, 31.0, 31.0, 41.0, 57.0, 72.0, 108.0, 141.0, 182.0, 280.0, 388.0, 764.0, 605.0, 361.0, 233.0, 159.0, 119.0, 80.0, 58.0, 50.0, 48.0, 36.0, 21.0, 26.0, 24.0, 13.0, 11.0, 10.0, 7.0, 7.0, 10.0, 1.0, 5.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7080078125, -0.6870956420898438, -0.6661834716796875, -0.6452713012695312, -0.624359130859375, -0.6034469604492188, -0.5825347900390625, -0.5616226196289062, -0.54071044921875, -0.5197982788085938, -0.4988861083984375, -0.47797393798828125, -0.457061767578125, -0.43614959716796875, -0.4152374267578125, -0.39432525634765625, -0.3734130859375, -0.35250091552734375, -0.3315887451171875, -0.31067657470703125, -0.289764404296875, -0.26885223388671875, -0.2479400634765625, -0.22702789306640625, -0.20611572265625, -0.18520355224609375, -0.1642913818359375, -0.14337921142578125, -0.122467041015625, -0.10155487060546875, -0.0806427001953125, -0.05973052978515625, -0.038818359375, -0.01790618896484375, 0.0030059814453125, 0.02391815185546875, 0.044830322265625, 0.06574249267578125, 0.0866546630859375, 0.10756683349609375, 0.12847900390625, 0.14939117431640625, 0.1703033447265625, 0.19121551513671875, 0.212127685546875, 0.23303985595703125, 0.2539520263671875, 0.27486419677734375, 0.2957763671875, 0.31668853759765625, 0.3376007080078125, 0.35851287841796875, 0.379425048828125, 0.40033721923828125, 0.4212493896484375, 0.44216156005859375, 0.46307373046875, 0.48398590087890625, 0.5048980712890625, 0.5258102416992188, 0.546722412109375, 0.5676345825195312, 0.5885467529296875, 0.6094589233398438, 0.63037109375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 31.0, 49.0, 80.0, 141.0, 144.0, 151.0, 154.0, 92.0, 63.0, 34.0, 11.0, 10.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.79248046875, -10.466913223266602, -10.141345977783203, -9.815778732299805, -9.490211486816406, -9.164644241333008, -8.83907699584961, -8.513510704040527, -8.187943458557129, -7.8623762130737305, -7.536808967590332, -7.211241722106934, -6.885674953460693, -6.560107707977295, -6.2345404624938965, -5.908973693847656, -5.5834059715271, -5.257838726043701, -4.932271480560303, -4.6067047119140625, -4.281137466430664, -3.9555702209472656, -3.630002975463867, -3.304435968399048, -2.9788687229156494, -2.653301477432251, -2.3277344703674316, -2.002167224884033, -1.6766000986099243, -1.3510329723358154, -1.025465726852417, -0.6998987197875977, -0.3743314743041992, -0.048764318227767944, 0.27680283784866333, 0.602370023727417, 0.9279371500015259, 1.2535042762756348, 1.5790715217590332, 1.9046385288238525, 2.230205774307251, 2.5557730197906494, 2.8813400268554688, 3.206907272338867, 3.5324745178222656, 3.858041524887085, 4.1836090087890625, 4.509175777435303, 4.834743022918701, 5.1603102684021, 5.485877513885498, 5.811444282531738, 6.137011528015137, 6.462578773498535, 6.788146018981934, 7.113713264465332, 7.4392805099487305, 7.764847755432129, 8.090415000915527, 8.415982246398926, 8.741549491882324, 9.067115783691406, 9.392683029174805, 9.718250274658203, 10.043817520141602]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 5.0, 7.0, 13.0, 8.0, 15.0, 11.0, 20.0, 26.0, 27.0, 19.0, 37.0, 25.0, 36.0, 36.0, 34.0, 31.0, 49.0, 44.0, 37.0, 42.0, 43.0, 36.0, 40.0, 57.0, 45.0, 29.0, 30.0, 31.0, 34.0, 23.0, 15.0, 12.0, 10.0, 11.0, 12.0, 7.0, 10.0, 10.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4861373901367188, -3.382718801498413, -3.2793002128601074, -3.1758813858032227, -3.072462797164917, -2.9690442085266113, -2.8656256198883057, -2.76220703125, -2.6587882041931152, -2.5553696155548096, -2.451951026916504, -2.348532199859619, -2.2451136112213135, -2.141695022583008, -2.038276433944702, -1.9348578453063965, -1.8314392566680908, -1.7280206680297852, -1.62460196018219, -1.5211833715438843, -1.417764663696289, -1.3143460750579834, -1.2109274864196777, -1.107508897781372, -1.0040901899337769, -0.9006715416908264, -0.797252893447876, -0.6938343048095703, -0.5904156565666199, -0.48699700832366943, -0.38357841968536377, -0.28015977144241333, -0.176741361618042, -0.07332272827625275, 0.0300959050655365, 0.13351452350616455, 0.236933171749115, 0.34035181999206543, 0.4437704086303711, 0.5471890568733215, 0.650607705116272, 0.7540263533592224, 0.8574450016021729, 0.9608635902404785, 1.0642821788787842, 1.1677008867263794, 1.271119475364685, 1.3745381832122803, 1.477956771850586, 1.5813753604888916, 1.6847940683364868, 1.7882126569747925, 1.8916313648223877, 1.9950499534606934, 2.098468542098999, 2.2018871307373047, 2.3053059577941895, 2.408724546432495, 2.512143135070801, 2.6155619621276855, 2.718980550765991, 2.822399139404297, 2.9258177280426025, 3.029236316680908, 3.132654905319214]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 12.0, 10.0, 12.0, 25.0, 38.0, 37.0, 106.0, 162.0, 348.0, 848.0, 2409.0, 8774.0, 37859.0, 184855.0, 517752.0, 232330.0, 47465.0, 10706.0, 2971.0, 982.0, 354.0, 178.0, 95.0, 70.0, 46.0, 31.0, 19.0, 11.0, 13.0, 5.0, 7.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.609375, -6.423583984375, -6.23779296875, -6.052001953125, -5.8662109375, -5.680419921875, -5.49462890625, -5.308837890625, -5.123046875, -4.937255859375, -4.75146484375, -4.565673828125, -4.3798828125, -4.194091796875, -4.00830078125, -3.822509765625, -3.63671875, -3.450927734375, -3.26513671875, -3.079345703125, -2.8935546875, -2.707763671875, -2.52197265625, -2.336181640625, -2.150390625, -1.964599609375, -1.77880859375, -1.593017578125, -1.4072265625, -1.221435546875, -1.03564453125, -0.849853515625, -0.6640625, -0.478271484375, -0.29248046875, -0.106689453125, 0.0791015625, 0.264892578125, 0.45068359375, 0.636474609375, 0.822265625, 1.008056640625, 1.19384765625, 1.379638671875, 1.5654296875, 1.751220703125, 1.93701171875, 2.122802734375, 2.30859375, 2.494384765625, 2.68017578125, 2.865966796875, 3.0517578125, 3.237548828125, 3.42333984375, 3.609130859375, 3.794921875, 3.980712890625, 4.16650390625, 4.352294921875, 4.5380859375, 4.723876953125, 4.90966796875, 5.095458984375, 5.28125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 8.0, 14.0, 17.0, 13.0, 21.0, 18.0, 23.0, 28.0, 42.0, 49.0, 54.0, 54.0, 48.0, 51.0, 59.0, 63.0, 55.0, 51.0, 52.0, 51.0, 48.0, 33.0, 24.0, 21.0, 23.0, 23.0, 11.0, 13.0, 11.0, 5.0, 2.0, 9.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.27655792236328125, -0.2669830322265625, -0.25740814208984375, -0.247833251953125, -0.23825836181640625, -0.2286834716796875, -0.21910858154296875, -0.20953369140625, -0.19995880126953125, -0.1903839111328125, -0.18080902099609375, -0.171234130859375, -0.16165924072265625, -0.1520843505859375, -0.14250946044921875, -0.1329345703125, -0.12335968017578125, -0.1137847900390625, -0.10420989990234375, -0.094635009765625, -0.08506011962890625, -0.0754852294921875, -0.06591033935546875, -0.05633544921875, -0.04676055908203125, -0.0371856689453125, -0.02761077880859375, -0.018035888671875, -0.00846099853515625, 0.0011138916015625, 0.01068878173828125, 0.020263671875, 0.02983856201171875, 0.0394134521484375, 0.04898834228515625, 0.058563232421875, 0.06813812255859375, 0.0777130126953125, 0.08728790283203125, 0.09686279296875, 0.10643768310546875, 0.1160125732421875, 0.12558746337890625, 0.135162353515625, 0.14473724365234375, 0.1543121337890625, 0.16388702392578125, 0.1734619140625, 0.18303680419921875, 0.1926116943359375, 0.20218658447265625, 0.211761474609375, 0.22133636474609375, 0.2309112548828125, 0.24048614501953125, 0.25006103515625, 0.25963592529296875, 0.2692108154296875, 0.27878570556640625, 0.288360595703125, 0.29793548583984375, 0.3075103759765625, 0.31708526611328125, 0.32666015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 14.0, 20.0, 21.0, 38.0, 65.0, 100.0, 157.0, 252.0, 438.0, 766.0, 1556.0, 3724.0, 9858.0, 31056.0, 108213.0, 340828.0, 370744.0, 125672.0, 35821.0, 11264.0, 4141.0, 1727.0, 865.0, 472.0, 295.0, 153.0, 95.0, 66.0, 39.0, 33.0, 13.0, 13.0, 4.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5703125, -5.41998291015625, -5.2696533203125, -5.11932373046875, -4.968994140625, -4.81866455078125, -4.6683349609375, -4.51800537109375, -4.36767578125, -4.21734619140625, -4.0670166015625, -3.91668701171875, -3.766357421875, -3.61602783203125, -3.4656982421875, -3.31536865234375, -3.1650390625, -3.01470947265625, -2.8643798828125, -2.71405029296875, -2.563720703125, -2.41339111328125, -2.2630615234375, -2.11273193359375, -1.96240234375, -1.81207275390625, -1.6617431640625, -1.51141357421875, -1.361083984375, -1.21075439453125, -1.0604248046875, -0.91009521484375, -0.759765625, -0.60943603515625, -0.4591064453125, -0.30877685546875, -0.158447265625, -0.00811767578125, 0.1422119140625, 0.29254150390625, 0.44287109375, 0.59320068359375, 0.7435302734375, 0.89385986328125, 1.044189453125, 1.19451904296875, 1.3448486328125, 1.49517822265625, 1.6455078125, 1.79583740234375, 1.9461669921875, 2.09649658203125, 2.246826171875, 2.39715576171875, 2.5474853515625, 2.69781494140625, 2.84814453125, 2.99847412109375, 3.1488037109375, 3.29913330078125, 3.449462890625, 3.59979248046875, 3.7501220703125, 3.90045166015625, 4.05078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 9.0, 11.0, 13.0, 10.0, 20.0, 23.0, 14.0, 31.0, 33.0, 31.0, 39.0, 42.0, 42.0, 43.0, 46.0, 46.0, 51.0, 39.0, 35.0, 32.0, 44.0, 38.0, 46.0, 39.0, 33.0, 27.0, 25.0, 18.0, 25.0, 11.0, 14.0, 16.0, 13.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.021484375, -1.9655303955078125, -1.909576416015625, -1.8536224365234375, -1.79766845703125, -1.7417144775390625, -1.685760498046875, -1.6298065185546875, -1.5738525390625, -1.5178985595703125, -1.461944580078125, -1.4059906005859375, -1.35003662109375, -1.2940826416015625, -1.238128662109375, -1.1821746826171875, -1.126220703125, -1.0702667236328125, -1.014312744140625, -0.9583587646484375, -0.90240478515625, -0.8464508056640625, -0.790496826171875, -0.7345428466796875, -0.6785888671875, -0.6226348876953125, -0.566680908203125, -0.5107269287109375, -0.45477294921875, -0.3988189697265625, -0.342864990234375, -0.2869110107421875, -0.23095703125, -0.1750030517578125, -0.119049072265625, -0.0630950927734375, -0.00714111328125, 0.0488128662109375, 0.104766845703125, 0.1607208251953125, 0.2166748046875, 0.2726287841796875, 0.328582763671875, 0.3845367431640625, 0.44049072265625, 0.4964447021484375, 0.552398681640625, 0.6083526611328125, 0.664306640625, 0.7202606201171875, 0.776214599609375, 0.8321685791015625, 0.88812255859375, 0.9440765380859375, 1.000030517578125, 1.0559844970703125, 1.1119384765625, 1.1678924560546875, 1.223846435546875, 1.2798004150390625, 1.33575439453125, 1.3917083740234375, 1.447662353515625, 1.5036163330078125, 1.5595703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 9.0, 3.0, 8.0, 19.0, 25.0, 66.0, 131.0, 288.0, 835.0, 2765.0, 14930.0, 237012.0, 739626.0, 44896.0, 5637.0, 1420.0, 501.0, 174.0, 80.0, 53.0, 25.0, 18.0, 12.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.1171875, -12.799072265625, -12.48095703125, -12.162841796875, -11.8447265625, -11.526611328125, -11.20849609375, -10.890380859375, -10.572265625, -10.254150390625, -9.93603515625, -9.617919921875, -9.2998046875, -8.981689453125, -8.66357421875, -8.345458984375, -8.02734375, -7.709228515625, -7.39111328125, -7.072998046875, -6.7548828125, -6.436767578125, -6.11865234375, -5.800537109375, -5.482421875, -5.164306640625, -4.84619140625, -4.528076171875, -4.2099609375, -3.891845703125, -3.57373046875, -3.255615234375, -2.9375, -2.619384765625, -2.30126953125, -1.983154296875, -1.6650390625, -1.346923828125, -1.02880859375, -0.710693359375, -0.392578125, -0.074462890625, 0.24365234375, 0.561767578125, 0.8798828125, 1.197998046875, 1.51611328125, 1.834228515625, 2.15234375, 2.470458984375, 2.78857421875, 3.106689453125, 3.4248046875, 3.742919921875, 4.06103515625, 4.379150390625, 4.697265625, 5.015380859375, 5.33349609375, 5.651611328125, 5.9697265625, 6.287841796875, 6.60595703125, 6.924072265625, 7.2421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 10.0, 20.0, 25.0, 47.0, 66.0, 79.0, 130.0, 144.0, 124.0, 92.0, 82.0, 48.0, 38.0, 22.0, 14.0, 19.0, 4.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009655952453613281, -0.0009393468499183655, -0.0009130984544754028, -0.0008868500590324402, -0.0008606016635894775, -0.0008343532681465149, -0.0008081048727035522, -0.0007818564772605896, -0.000755608081817627, -0.0007293596863746643, -0.0007031112909317017, -0.000676862895488739, -0.0006506145000457764, -0.0006243661046028137, -0.0005981177091598511, -0.0005718693137168884, -0.0005456209182739258, -0.0005193725228309631, -0.0004931241273880005, -0.00046687573194503784, -0.0004406273365020752, -0.00041437894105911255, -0.0003881305456161499, -0.00036188215017318726, -0.0003356337547302246, -0.00030938535928726196, -0.0002831369638442993, -0.00025688856840133667, -0.00023064017295837402, -0.00020439177751541138, -0.00017814338207244873, -0.00015189498662948608, -0.00012564659118652344, -9.939819574356079e-05, -7.314980030059814e-05, -4.69014048576355e-05, -2.065300941467285e-05, 5.595386028289795e-06, 3.184378147125244e-05, 5.809217691421509e-05, 8.434057235717773e-05, 0.00011058896780014038, 0.00013683736324310303, 0.00016308575868606567, 0.00018933415412902832, 0.00021558254957199097, 0.0002418309450149536, 0.00026807934045791626, 0.0002943277359008789, 0.00032057613134384155, 0.0003468245267868042, 0.00037307292222976685, 0.0003993213176727295, 0.00042556971311569214, 0.0004518181085586548, 0.00047806650400161743, 0.0005043148994445801, 0.0005305632948875427, 0.0005568116903305054, 0.000583060085773468, 0.0006093084812164307, 0.0006355568766593933, 0.000661805272102356, 0.0006880536675453186, 0.0007143020629882812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 8.0, 5.0, 12.0, 22.0, 16.0, 21.0, 32.0, 48.0, 63.0, 99.0, 151.0, 243.0, 316.0, 504.0, 908.0, 1438.0, 2762.0, 5699.0, 14600.0, 55679.0, 365186.0, 492475.0, 77674.0, 17497.0, 6315.0, 2900.0, 1499.0, 840.0, 521.0, 332.0, 224.0, 135.0, 101.0, 71.0, 50.0, 29.0, 26.0, 12.0, 7.0, 11.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.92578125, -5.7352294921875, -5.544677734375, -5.3541259765625, -5.16357421875, -4.9730224609375, -4.782470703125, -4.5919189453125, -4.4013671875, -4.2108154296875, -4.020263671875, -3.8297119140625, -3.63916015625, -3.4486083984375, -3.258056640625, -3.0675048828125, -2.876953125, -2.6864013671875, -2.495849609375, -2.3052978515625, -2.11474609375, -1.9241943359375, -1.733642578125, -1.5430908203125, -1.3525390625, -1.1619873046875, -0.971435546875, -0.7808837890625, -0.59033203125, -0.3997802734375, -0.209228515625, -0.0186767578125, 0.171875, 0.3624267578125, 0.552978515625, 0.7435302734375, 0.93408203125, 1.1246337890625, 1.315185546875, 1.5057373046875, 1.6962890625, 1.8868408203125, 2.077392578125, 2.2679443359375, 2.45849609375, 2.6490478515625, 2.839599609375, 3.0301513671875, 3.220703125, 3.4112548828125, 3.601806640625, 3.7923583984375, 3.98291015625, 4.1734619140625, 4.364013671875, 4.5545654296875, 4.7451171875, 4.9356689453125, 5.126220703125, 5.3167724609375, 5.50732421875, 5.6978759765625, 5.888427734375, 6.0789794921875, 6.26953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 15.0, 25.0, 33.0, 51.0, 93.0, 145.0, 217.0, 174.0, 102.0, 49.0, 37.0, 20.0, 13.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.940185546875, -3.80224609375, -3.664306640625, -3.5263671875, -3.388427734375, -3.25048828125, -3.112548828125, -2.974609375, -2.836669921875, -2.69873046875, -2.560791015625, -2.4228515625, -2.284912109375, -2.14697265625, -2.009033203125, -1.87109375, -1.733154296875, -1.59521484375, -1.457275390625, -1.3193359375, -1.181396484375, -1.04345703125, -0.905517578125, -0.767578125, -0.629638671875, -0.49169921875, -0.353759765625, -0.2158203125, -0.077880859375, 0.06005859375, 0.197998046875, 0.3359375, 0.473876953125, 0.61181640625, 0.749755859375, 0.8876953125, 1.025634765625, 1.16357421875, 1.301513671875, 1.439453125, 1.577392578125, 1.71533203125, 1.853271484375, 1.9912109375, 2.129150390625, 2.26708984375, 2.405029296875, 2.54296875, 2.680908203125, 2.81884765625, 2.956787109375, 3.0947265625, 3.232666015625, 3.37060546875, 3.508544921875, 3.646484375, 3.784423828125, 3.92236328125, 4.060302734375, 4.1982421875, 4.336181640625, 4.47412109375, 4.612060546875, 4.75]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 32.0, 41.0, 61.0, 116.0, 158.0, 162.0, 160.0, 116.0, 63.0, 22.0, 17.0, 8.0, 8.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.91203308105469, -42.69949722290039, -41.48695755004883, -40.27442169189453, -39.06188201904297, -37.84934616088867, -36.63680648803711, -35.42427062988281, -34.21173095703125, -32.99919509887695, -31.78665542602539, -30.57411766052246, -29.36157989501953, -28.149044036865234, -26.936506271362305, -25.723968505859375, -24.511432647705078, -23.29889488220215, -22.08635711669922, -20.87381935119629, -19.66128158569336, -18.448745727539062, -17.236207962036133, -16.023670196533203, -14.811132431030273, -13.598594665527344, -12.386056900024414, -11.1735200881958, -9.960982322692871, -8.748444557189941, -7.53590726852417, -6.323369979858398, -5.110832214355469, -3.898294687271118, -2.6857571601867676, -1.473219633102417, -0.2606821060180664, 0.9518556594848633, 2.1643929481506348, 3.3769302368164062, 4.589468002319336, 5.802005767822266, 7.014543056488037, 8.227080345153809, 9.439618110656738, 10.652155876159668, 11.864692687988281, 13.077230453491211, 14.28976821899414, 15.50230598449707, 16.71484375, 17.92738151550293, 19.13991928100586, 20.352455139160156, 21.564992904663086, 22.777530670166016, 23.990068435668945, 25.202606201171875, 26.415143966674805, 27.627681732177734, 28.84021759033203, 30.052757263183594, 31.26529312133789, 32.47782897949219, 33.69036865234375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 9.0, 7.0, 10.0, 13.0, 20.0, 20.0, 20.0, 20.0, 21.0, 33.0, 34.0, 47.0, 36.0, 30.0, 31.0, 34.0, 48.0, 42.0, 38.0, 44.0, 40.0, 41.0, 40.0, 30.0, 32.0, 41.0, 25.0, 29.0, 17.0, 20.0, 11.0, 10.0, 17.0, 9.0, 15.0, 12.0, 6.0, 9.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-14.64193058013916, -14.238665580749512, -13.83540153503418, -13.432136535644531, -13.028871536254883, -12.62560749053955, -12.222342491149902, -11.81907844543457, -11.415813446044922, -11.012548446655273, -10.609284400939941, -10.206019401550293, -9.802754402160645, -9.399490356445312, -8.996225357055664, -8.592960357666016, -8.189695358276367, -7.786430835723877, -7.3831658363342285, -6.979901313781738, -6.576636791229248, -6.173372268676758, -5.770107269287109, -5.366842746734619, -4.963578224182129, -4.560313701629639, -4.15704870223999, -3.7537841796875, -3.3505196571350098, -2.9472548961639404, -2.543990135192871, -2.140725612640381, -1.7374610900878906, -1.3341964483261108, -0.9309317469596863, -0.5276670455932617, -0.12440240383148193, 0.27886223793029785, 0.6821269989013672, 1.0853915214538574, 1.4886562824249268, 1.8919209241867065, 2.2951855659484863, 2.6984503269195557, 3.101715087890625, 3.5049796104431152, 3.9082443714141846, 4.311509132385254, 4.714773654937744, 5.118038177490234, 5.521303176879883, 5.924567699432373, 6.327832221984863, 6.731097221374512, 7.134361743927002, 7.537626266479492, 7.940891265869141, 8.344156265258789, 8.747420310974121, 9.15068531036377, 9.553950309753418, 9.95721435546875, 10.360479354858398, 10.763744354248047, 11.167008399963379]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 10.0, 12.0, 18.0, 16.0, 16.0, 34.0, 80.0, 93.0, 146.0, 320.0, 580.0, 1353.0, 3766.0, 12153.0, 50585.0, 308386.0, 3492631.0, 262019.0, 44801.0, 11230.0, 3460.0, 1268.0, 551.0, 247.0, 128.0, 89.0, 50.0, 43.0, 35.0, 24.0, 18.0, 17.0, 24.0, 17.0, 7.0, 12.0, 10.0, 4.0, 5.0, 3.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.78515625, -6.52874755859375, -6.2723388671875, -6.01593017578125, -5.759521484375, -5.50311279296875, -5.2467041015625, -4.99029541015625, -4.73388671875, -4.47747802734375, -4.2210693359375, -3.96466064453125, -3.708251953125, -3.45184326171875, -3.1954345703125, -2.93902587890625, -2.6826171875, -2.42620849609375, -2.1697998046875, -1.91339111328125, -1.656982421875, -1.40057373046875, -1.1441650390625, -0.88775634765625, -0.63134765625, -0.37493896484375, -0.1185302734375, 0.13787841796875, 0.394287109375, 0.65069580078125, 0.9071044921875, 1.16351318359375, 1.419921875, 1.67633056640625, 1.9327392578125, 2.18914794921875, 2.445556640625, 2.70196533203125, 2.9583740234375, 3.21478271484375, 3.47119140625, 3.72760009765625, 3.9840087890625, 4.24041748046875, 4.496826171875, 4.75323486328125, 5.0096435546875, 5.26605224609375, 5.5224609375, 5.77886962890625, 6.0352783203125, 6.29168701171875, 6.548095703125, 6.80450439453125, 7.0609130859375, 7.31732177734375, 7.57373046875, 7.83013916015625, 8.0865478515625, 8.34295654296875, 8.599365234375, 8.85577392578125, 9.1121826171875, 9.36859130859375, 9.625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 6.0, 13.0, 19.0, 13.0, 20.0, 29.0, 23.0, 44.0, 49.0, 46.0, 52.0, 46.0, 56.0, 59.0, 56.0, 66.0, 59.0, 59.0, 44.0, 46.0, 45.0, 36.0, 22.0, 19.0, 12.0, 17.0, 13.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.403564453125, -0.3905754089355469, -0.37758636474609375, -0.3645973205566406, -0.3516082763671875, -0.3386192321777344, -0.32563018798828125, -0.3126411437988281, -0.299652099609375, -0.2866630554199219, -0.27367401123046875, -0.2606849670410156, -0.2476959228515625, -0.23470687866210938, -0.22171783447265625, -0.20872879028320312, -0.19573974609375, -0.18275070190429688, -0.16976165771484375, -0.15677261352539062, -0.1437835693359375, -0.13079452514648438, -0.11780548095703125, -0.10481643676757812, -0.091827392578125, -0.07883834838867188, -0.06584930419921875, -0.052860260009765625, -0.0398712158203125, -0.026882171630859375, -0.01389312744140625, -0.000904083251953125, 0.0120849609375, 0.025074005126953125, 0.03806304931640625, 0.051052093505859375, 0.0640411376953125, 0.07703018188476562, 0.09001922607421875, 0.10300827026367188, 0.115997314453125, 0.12898635864257812, 0.14197540283203125, 0.15496444702148438, 0.1679534912109375, 0.18094253540039062, 0.19393157958984375, 0.20692062377929688, 0.21990966796875, 0.23289871215820312, 0.24588775634765625, 0.2588768005371094, 0.2718658447265625, 0.2848548889160156, 0.29784393310546875, 0.3108329772949219, 0.323822021484375, 0.3368110656738281, 0.34980010986328125, 0.3627891540527344, 0.3757781982421875, 0.3887672424316406, 0.40175628662109375, 0.4147453308105469, 0.427734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 17.0, 48.0, 64.0, 142.0, 255.0, 576.0, 1748.0, 5871.0, 24263.0, 141825.0, 2615822.0, 1267949.0, 108600.0, 19540.0, 4826.0, 1564.0, 613.0, 260.0, 138.0, 63.0, 60.0, 14.0, 10.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6328125, -9.34033203125, -9.0478515625, -8.75537109375, -8.462890625, -8.17041015625, -7.8779296875, -7.58544921875, -7.29296875, -7.00048828125, -6.7080078125, -6.41552734375, -6.123046875, -5.83056640625, -5.5380859375, -5.24560546875, -4.953125, -4.66064453125, -4.3681640625, -4.07568359375, -3.783203125, -3.49072265625, -3.1982421875, -2.90576171875, -2.61328125, -2.32080078125, -2.0283203125, -1.73583984375, -1.443359375, -1.15087890625, -0.8583984375, -0.56591796875, -0.2734375, 0.01904296875, 0.3115234375, 0.60400390625, 0.896484375, 1.18896484375, 1.4814453125, 1.77392578125, 2.06640625, 2.35888671875, 2.6513671875, 2.94384765625, 3.236328125, 3.52880859375, 3.8212890625, 4.11376953125, 4.40625, 4.69873046875, 4.9912109375, 5.28369140625, 5.576171875, 5.86865234375, 6.1611328125, 6.45361328125, 6.74609375, 7.03857421875, 7.3310546875, 7.62353515625, 7.916015625, 8.20849609375, 8.5009765625, 8.79345703125, 9.0859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 8.0, 15.0, 19.0, 32.0, 29.0, 39.0, 63.0, 75.0, 121.0, 142.0, 190.0, 300.0, 607.0, 1167.0, 393.0, 234.0, 168.0, 131.0, 74.0, 67.0, 45.0, 34.0, 27.0, 20.0, 8.0, 17.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87255859375, -0.8350296020507812, -0.7975006103515625, -0.7599716186523438, -0.722442626953125, -0.6849136352539062, -0.6473846435546875, -0.6098556518554688, -0.57232666015625, -0.5347976684570312, -0.4972686767578125, -0.45973968505859375, -0.422210693359375, -0.38468170166015625, -0.3471527099609375, -0.30962371826171875, -0.2720947265625, -0.23456573486328125, -0.1970367431640625, -0.15950775146484375, -0.121978759765625, -0.08444976806640625, -0.0469207763671875, -0.00939178466796875, 0.02813720703125, 0.06566619873046875, 0.1031951904296875, 0.14072418212890625, 0.178253173828125, 0.21578216552734375, 0.2533111572265625, 0.29084014892578125, 0.328369140625, 0.36589813232421875, 0.4034271240234375, 0.44095611572265625, 0.478485107421875, 0.5160140991210938, 0.5535430908203125, 0.5910720825195312, 0.62860107421875, 0.6661300659179688, 0.7036590576171875, 0.7411880493164062, 0.778717041015625, 0.8162460327148438, 0.8537750244140625, 0.8913040161132812, 0.9288330078125, 0.9663619995117188, 1.0038909912109375, 1.0414199829101562, 1.078948974609375, 1.1164779663085938, 1.1540069580078125, 1.1915359497070312, 1.22906494140625, 1.2665939331054688, 1.3041229248046875, 1.3416519165039062, 1.379180908203125, 1.4167098999023438, 1.4542388916015625, 1.4917678833007812, 1.529296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 6.0, 12.0, 21.0, 29.0, 57.0, 114.0, 146.0, 170.0, 149.0, 107.0, 83.0, 50.0, 28.0, 13.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.02840805053711, -9.589086532592773, -9.149764060974121, -8.710442543029785, -8.27112102508545, -7.831799030303955, -7.392477035522461, -6.953155517578125, -6.513833522796631, -6.074511528015137, -5.635190010070801, -5.195868015289307, -4.7565460205078125, -4.317224502563477, -3.8779025077819824, -3.4385807514190674, -2.9992589950561523, -2.5599372386932373, -2.1206154823303223, -1.6812934875488281, -1.241971731185913, -0.802649974822998, -0.3633279800415039, 0.07599377632141113, 0.5153155326843262, 0.954637348651886, 1.3939591646194458, 1.8332810401916504, 2.2726027965545654, 2.7119245529174805, 3.1512465476989746, 3.5905683040618896, 4.029890060424805, 4.469212055206299, 4.908533573150635, 5.347855567932129, 5.787177085876465, 6.226499080657959, 6.665821075439453, 7.105142593383789, 7.544464588165283, 7.983786582946777, 8.423108100891113, 8.862430572509766, 9.301752090454102, 9.741073608398438, 10.180395126342773, 10.619717597961426, 11.059039115905762, 11.498360633850098, 11.93768310546875, 12.377004623413086, 12.816326141357422, 13.255647659301758, 13.69497013092041, 14.134291648864746, 14.573614120483398, 15.012935638427734, 15.452258110046387, 15.891579627990723, 16.330902099609375, 16.77022361755371, 17.209545135498047, 17.648866653442383, 18.08818817138672]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 5.0, 9.0, 9.0, 13.0, 16.0, 13.0, 22.0, 28.0, 15.0, 35.0, 28.0, 44.0, 36.0, 45.0, 30.0, 35.0, 45.0, 47.0, 40.0, 41.0, 47.0, 38.0, 35.0, 42.0, 39.0, 38.0, 28.0, 23.0, 19.0, 22.0, 12.0, 14.0, 14.0, 11.0, 8.0, 10.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.598965644836426, -4.44852876663208, -4.298092365264893, -4.147655487060547, -3.997218608856201, -3.8467819690704346, -3.696345329284668, -3.5459084510803223, -3.3954718112945557, -3.245035171508789, -3.0945982933044434, -2.9441616535186768, -2.79372501373291, -2.6432881355285645, -2.492851495742798, -2.3424148559570312, -2.1919779777526855, -2.041541337966919, -1.8911044597625732, -1.7406678199768066, -1.5902310609817505, -1.4397943019866943, -1.2893576622009277, -1.1389209032058716, -0.9884841442108154, -0.8380473852157593, -0.6876106858253479, -0.5371739864349365, -0.38673722743988037, -0.23630046844482422, -0.08586376905441284, 0.06457293033599854, 0.21500921249389648, 0.36544594168663025, 0.515882670879364, 0.6663193702697754, 0.8167561292648315, 0.9671928882598877, 1.1176295280456543, 1.2680662870407104, 1.4185030460357666, 1.5689398050308228, 1.719376564025879, 1.8698132038116455, 2.020249843597412, 2.170686721801758, 2.3211233615875244, 2.471560001373291, 2.6219968795776367, 2.7724335193634033, 2.922870397567749, 3.0733070373535156, 3.2237439155578613, 3.374180555343628, 3.5246171951293945, 3.6750540733337402, 3.825490713119507, 3.9759273529052734, 4.126364231109619, 4.276801109313965, 4.427237510681152, 4.577674388885498, 4.728111267089844, 4.878547668457031, 5.028984546661377]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 8.0, 15.0, 18.0, 20.0, 31.0, 40.0, 55.0, 92.0, 176.0, 320.0, 580.0, 1305.0, 3260.0, 7908.0, 22009.0, 60333.0, 158540.0, 318209.0, 278384.0, 123321.0, 46137.0, 16897.0, 6321.0, 2401.0, 1035.0, 493.0, 221.0, 140.0, 100.0, 46.0, 35.0, 33.0, 12.0, 14.0, 8.0, 3.0, 6.0, 7.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.392242431640625, -3.27471923828125, -3.157196044921875, -3.0396728515625, -2.922149658203125, -2.80462646484375, -2.687103271484375, -2.569580078125, -2.452056884765625, -2.33453369140625, -2.217010498046875, -2.0994873046875, -1.981964111328125, -1.86444091796875, -1.746917724609375, -1.62939453125, -1.511871337890625, -1.39434814453125, -1.276824951171875, -1.1593017578125, -1.041778564453125, -0.92425537109375, -0.806732177734375, -0.689208984375, -0.571685791015625, -0.45416259765625, -0.336639404296875, -0.2191162109375, -0.101593017578125, 0.01593017578125, 0.133453369140625, 0.2509765625, 0.368499755859375, 0.48602294921875, 0.603546142578125, 0.7210693359375, 0.838592529296875, 0.95611572265625, 1.073638916015625, 1.191162109375, 1.308685302734375, 1.42620849609375, 1.543731689453125, 1.6612548828125, 1.778778076171875, 1.89630126953125, 2.013824462890625, 2.13134765625, 2.248870849609375, 2.36639404296875, 2.483917236328125, 2.6014404296875, 2.718963623046875, 2.83648681640625, 2.954010009765625, 3.071533203125, 3.189056396484375, 3.30657958984375, 3.424102783203125, 3.5416259765625, 3.659149169921875, 3.77667236328125, 3.894195556640625, 4.01171875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 14.0, 21.0, 20.0, 21.0, 26.0, 28.0, 41.0, 43.0, 38.0, 48.0, 41.0, 49.0, 69.0, 52.0, 66.0, 69.0, 60.0, 36.0, 53.0, 35.0, 30.0, 25.0, 20.0, 21.0, 12.0, 11.0, 8.0, 10.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.57080078125, -0.5566215515136719, -0.5424423217773438, -0.5282630920410156, -0.5140838623046875, -0.4999046325683594, -0.48572540283203125, -0.4715461730957031, -0.457366943359375, -0.4431877136230469, -0.42900848388671875, -0.4148292541503906, -0.4006500244140625, -0.3864707946777344, -0.37229156494140625, -0.3581123352050781, -0.34393310546875, -0.3297538757324219, -0.31557464599609375, -0.3013954162597656, -0.2872161865234375, -0.2730369567871094, -0.25885772705078125, -0.24467849731445312, -0.230499267578125, -0.21632003784179688, -0.20214080810546875, -0.18796157836914062, -0.1737823486328125, -0.15960311889648438, -0.14542388916015625, -0.13124465942382812, -0.1170654296875, -0.10288619995117188, -0.08870697021484375, -0.07452774047851562, -0.0603485107421875, -0.046169281005859375, -0.03199005126953125, -0.017810821533203125, -0.003631591796875, 0.010547637939453125, 0.02472686767578125, 0.038906097412109375, 0.0530853271484375, 0.06726455688476562, 0.08144378662109375, 0.09562301635742188, 0.10980224609375, 0.12398147583007812, 0.13816070556640625, 0.15233993530273438, 0.1665191650390625, 0.18069839477539062, 0.19487762451171875, 0.20905685424804688, 0.223236083984375, 0.23741531372070312, 0.25159454345703125, 0.2657737731933594, 0.2799530029296875, 0.2941322326660156, 0.30831146240234375, 0.3224906921386719, 0.336669921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 14.0, 19.0, 17.0, 33.0, 60.0, 62.0, 85.0, 96.0, 198.0, 276.0, 435.0, 748.0, 1431.0, 3074.0, 7822.0, 21355.0, 64223.0, 191617.0, 391102.0, 238895.0, 82547.0, 27043.0, 9681.0, 3867.0, 1600.0, 852.0, 493.0, 288.0, 179.0, 122.0, 71.0, 58.0, 46.0, 39.0, 22.0, 14.0, 19.0, 10.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.7578125, -4.61627197265625, -4.4747314453125, -4.33319091796875, -4.191650390625, -4.05010986328125, -3.9085693359375, -3.76702880859375, -3.62548828125, -3.48394775390625, -3.3424072265625, -3.20086669921875, -3.059326171875, -2.91778564453125, -2.7762451171875, -2.63470458984375, -2.4931640625, -2.35162353515625, -2.2100830078125, -2.06854248046875, -1.927001953125, -1.78546142578125, -1.6439208984375, -1.50238037109375, -1.36083984375, -1.21929931640625, -1.0777587890625, -0.93621826171875, -0.794677734375, -0.65313720703125, -0.5115966796875, -0.37005615234375, -0.228515625, -0.08697509765625, 0.0545654296875, 0.19610595703125, 0.337646484375, 0.47918701171875, 0.6207275390625, 0.76226806640625, 0.90380859375, 1.04534912109375, 1.1868896484375, 1.32843017578125, 1.469970703125, 1.61151123046875, 1.7530517578125, 1.89459228515625, 2.0361328125, 2.17767333984375, 2.3192138671875, 2.46075439453125, 2.602294921875, 2.74383544921875, 2.8853759765625, 3.02691650390625, 3.16845703125, 3.30999755859375, 3.4515380859375, 3.59307861328125, 3.734619140625, 3.87615966796875, 4.0177001953125, 4.15924072265625, 4.30078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 8.0, 9.0, 9.0, 14.0, 14.0, 21.0, 13.0, 20.0, 24.0, 28.0, 23.0, 29.0, 26.0, 37.0, 35.0, 40.0, 33.0, 39.0, 39.0, 38.0, 49.0, 50.0, 37.0, 42.0, 47.0, 28.0, 29.0, 28.0, 24.0, 21.0, 22.0, 31.0, 14.0, 13.0, 13.0, 14.0, 6.0, 7.0, 5.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.4453125, -2.3736572265625, -2.302001953125, -2.2303466796875, -2.15869140625, -2.0870361328125, -2.015380859375, -1.9437255859375, -1.8720703125, -1.8004150390625, -1.728759765625, -1.6571044921875, -1.58544921875, -1.5137939453125, -1.442138671875, -1.3704833984375, -1.298828125, -1.2271728515625, -1.155517578125, -1.0838623046875, -1.01220703125, -0.9405517578125, -0.868896484375, -0.7972412109375, -0.7255859375, -0.6539306640625, -0.582275390625, -0.5106201171875, -0.43896484375, -0.3673095703125, -0.295654296875, -0.2239990234375, -0.15234375, -0.0806884765625, -0.009033203125, 0.0626220703125, 0.13427734375, 0.2059326171875, 0.277587890625, 0.3492431640625, 0.4208984375, 0.4925537109375, 0.564208984375, 0.6358642578125, 0.70751953125, 0.7791748046875, 0.850830078125, 0.9224853515625, 0.994140625, 1.0657958984375, 1.137451171875, 1.2091064453125, 1.28076171875, 1.3524169921875, 1.424072265625, 1.4957275390625, 1.5673828125, 1.6390380859375, 1.710693359375, 1.7823486328125, 1.85400390625, 1.9256591796875, 1.997314453125, 2.0689697265625, 2.140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 3.0, 4.0, 11.0, 14.0, 18.0, 26.0, 22.0, 50.0, 144.0, 274.0, 695.0, 2039.0, 7063.0, 33187.0, 253562.0, 631835.0, 97086.0, 16226.0, 4138.0, 1291.0, 460.0, 173.0, 95.0, 52.0, 26.0, 15.0, 11.0, 6.0, 4.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.05078125, -5.88848876953125, -5.7261962890625, -5.56390380859375, -5.401611328125, -5.23931884765625, -5.0770263671875, -4.91473388671875, -4.75244140625, -4.59014892578125, -4.4278564453125, -4.26556396484375, -4.103271484375, -3.94097900390625, -3.7786865234375, -3.61639404296875, -3.4541015625, -3.29180908203125, -3.1295166015625, -2.96722412109375, -2.804931640625, -2.64263916015625, -2.4803466796875, -2.31805419921875, -2.15576171875, -1.99346923828125, -1.8311767578125, -1.66888427734375, -1.506591796875, -1.34429931640625, -1.1820068359375, -1.01971435546875, -0.857421875, -0.69512939453125, -0.5328369140625, -0.37054443359375, -0.208251953125, -0.04595947265625, 0.1163330078125, 0.27862548828125, 0.44091796875, 0.60321044921875, 0.7655029296875, 0.92779541015625, 1.090087890625, 1.25238037109375, 1.4146728515625, 1.57696533203125, 1.7392578125, 1.90155029296875, 2.0638427734375, 2.22613525390625, 2.388427734375, 2.55072021484375, 2.7130126953125, 2.87530517578125, 3.03759765625, 3.19989013671875, 3.3621826171875, 3.52447509765625, 3.686767578125, 3.84906005859375, 4.0113525390625, 4.17364501953125, 4.3359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 5.0, 9.0, 5.0, 9.0, 10.0, 17.0, 18.0, 31.0, 35.0, 52.0, 72.0, 82.0, 100.0, 153.0, 78.0, 71.0, 65.0, 51.0, 28.0, 16.0, 23.0, 23.0, 16.0, 7.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005245208740234375, -0.0005087405443191528, -0.0004929602146148682, -0.0004771798849105835, -0.00046139955520629883, -0.00044561922550201416, -0.0004298388957977295, -0.0004140585660934448, -0.00039827823638916016, -0.0003824979066848755, -0.0003667175769805908, -0.00035093724727630615, -0.0003351569175720215, -0.0003193765878677368, -0.00030359625816345215, -0.0002878159284591675, -0.0002720355987548828, -0.00025625526905059814, -0.00024047493934631348, -0.0002246946096420288, -0.00020891427993774414, -0.00019313395023345947, -0.0001773536205291748, -0.00016157329082489014, -0.00014579296112060547, -0.0001300126314163208, -0.00011423230171203613, -9.845197200775146e-05, -8.26716423034668e-05, -6.689131259918213e-05, -5.111098289489746e-05, -3.533065319061279e-05, -1.9550323486328125e-05, -3.769993782043457e-06, 1.2010335922241211e-05, 2.779066562652588e-05, 4.357099533081055e-05, 5.9351325035095215e-05, 7.513165473937988e-05, 9.091198444366455e-05, 0.00010669231414794922, 0.0001224726438522339, 0.00013825297355651855, 0.00015403330326080322, 0.0001698136329650879, 0.00018559396266937256, 0.00020137429237365723, 0.0002171546220779419, 0.00023293495178222656, 0.00024871528148651123, 0.0002644956111907959, 0.00028027594089508057, 0.00029605627059936523, 0.0003118366003036499, 0.00032761693000793457, 0.00034339725971221924, 0.0003591775894165039, 0.0003749579191207886, 0.00039073824882507324, 0.0004065185785293579, 0.0004222989082336426, 0.00043807923793792725, 0.0004538595676422119, 0.0004696398973464966, 0.00048542022705078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 3.0, 11.0, 20.0, 28.0, 41.0, 70.0, 84.0, 158.0, 222.0, 423.0, 883.0, 1902.0, 4774.0, 14525.0, 58815.0, 381459.0, 484431.0, 73846.0, 17082.0, 5503.0, 2145.0, 945.0, 439.0, 278.0, 160.0, 97.0, 64.0, 52.0, 21.0, 14.0, 16.0, 7.0, 8.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.52056884765625, -5.3536376953125, -5.18670654296875, -5.019775390625, -4.85284423828125, -4.6859130859375, -4.51898193359375, -4.35205078125, -4.18511962890625, -4.0181884765625, -3.85125732421875, -3.684326171875, -3.51739501953125, -3.3504638671875, -3.18353271484375, -3.0166015625, -2.84967041015625, -2.6827392578125, -2.51580810546875, -2.348876953125, -2.18194580078125, -2.0150146484375, -1.84808349609375, -1.68115234375, -1.51422119140625, -1.3472900390625, -1.18035888671875, -1.013427734375, -0.84649658203125, -0.6795654296875, -0.51263427734375, -0.345703125, -0.17877197265625, -0.0118408203125, 0.15509033203125, 0.322021484375, 0.48895263671875, 0.6558837890625, 0.82281494140625, 0.98974609375, 1.15667724609375, 1.3236083984375, 1.49053955078125, 1.657470703125, 1.82440185546875, 1.9913330078125, 2.15826416015625, 2.3251953125, 2.49212646484375, 2.6590576171875, 2.82598876953125, 2.992919921875, 3.15985107421875, 3.3267822265625, 3.49371337890625, 3.66064453125, 3.82757568359375, 3.9945068359375, 4.16143798828125, 4.328369140625, 4.49530029296875, 4.6622314453125, 4.82916259765625, 4.99609375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 12.0, 14.0, 17.0, 27.0, 40.0, 42.0, 96.0, 110.0, 154.0, 164.0, 107.0, 62.0, 33.0, 38.0, 24.0, 17.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.318359375, -3.210296630859375, -3.10223388671875, -2.994171142578125, -2.8861083984375, -2.778045654296875, -2.66998291015625, -2.561920166015625, -2.453857421875, -2.345794677734375, -2.23773193359375, -2.129669189453125, -2.0216064453125, -1.913543701171875, -1.80548095703125, -1.697418212890625, -1.58935546875, -1.481292724609375, -1.37322998046875, -1.265167236328125, -1.1571044921875, -1.049041748046875, -0.94097900390625, -0.832916259765625, -0.724853515625, -0.616790771484375, -0.50872802734375, -0.400665283203125, -0.2926025390625, -0.184539794921875, -0.07647705078125, 0.031585693359375, 0.1396484375, 0.247711181640625, 0.35577392578125, 0.463836669921875, 0.5718994140625, 0.679962158203125, 0.78802490234375, 0.896087646484375, 1.004150390625, 1.112213134765625, 1.22027587890625, 1.328338623046875, 1.4364013671875, 1.544464111328125, 1.65252685546875, 1.760589599609375, 1.86865234375, 1.976715087890625, 2.08477783203125, 2.192840576171875, 2.3009033203125, 2.408966064453125, 2.51702880859375, 2.625091552734375, 2.733154296875, 2.841217041015625, 2.94927978515625, 3.057342529296875, 3.1654052734375, 3.273468017578125, 3.38153076171875, 3.489593505859375, 3.59765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 18.0, 16.0, 37.0, 50.0, 84.0, 130.0, 152.0, 145.0, 123.0, 95.0, 70.0, 24.0, 23.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.992528915405273, -27.789474487304688, -26.58641815185547, -25.383363723754883, -24.180307388305664, -22.977252960205078, -21.77419662475586, -20.571142196655273, -19.368087768554688, -18.1650333404541, -16.961977005004883, -15.758922576904297, -14.555866241455078, -13.352811813354492, -12.14975643157959, -10.946701049804688, -9.743644714355469, -8.540589332580566, -7.337533950805664, -6.13447904586792, -4.931423664093018, -3.7283682823181152, -2.525313377380371, -1.3222579956054688, -0.1192026138305664, 1.0838526487350464, 2.286907911300659, 3.4899630546569824, 4.693018436431885, 5.896073818206787, 7.099128723144531, 8.302184104919434, 9.505241394042969, 10.708296775817871, 11.911352157592773, 13.11440658569336, 14.317462921142578, 15.520517349243164, 16.72357177734375, 17.92662811279297, 19.129684448242188, 20.332738876342773, 21.535795211791992, 22.738849639892578, 23.941905975341797, 25.144960403442383, 26.34801483154297, 27.551071166992188, 28.754125595092773, 29.95718002319336, 31.160236358642578, 32.3632926940918, 33.56634521484375, 34.76940155029297, 35.97245788574219, 37.175514221191406, 38.37856674194336, 39.58162307739258, 40.78467559814453, 41.98773193359375, 43.19078826904297, 44.39384460449219, 45.59689712524414, 46.79995346069336, 48.00300979614258]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 9.0, 19.0, 11.0, 23.0, 26.0, 27.0, 42.0, 38.0, 53.0, 54.0, 50.0, 51.0, 53.0, 56.0, 46.0, 48.0, 59.0, 61.0, 41.0, 41.0, 35.0, 26.0, 17.0, 18.0, 20.0, 14.0, 20.0, 9.0, 9.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.384151458740234, -22.691268920898438, -21.99838638305664, -21.305503845214844, -20.61262321472168, -19.919740676879883, -19.226858139038086, -18.53397560119629, -17.841093063354492, -17.148210525512695, -16.4553279876709, -15.762446403503418, -15.069563865661621, -14.37668228149414, -13.683799743652344, -12.990917205810547, -12.298035621643066, -11.60515308380127, -10.912271499633789, -10.219388961791992, -9.526506423950195, -8.833623886108398, -8.140742301940918, -7.447859764099121, -6.754977703094482, -6.062095642089844, -5.369213104248047, -4.676331043243408, -3.9834487438201904, -3.2905664443969727, -2.597684383392334, -1.904801845550537, -1.2119197845458984, -0.5190375447273254, 0.17384469509124756, 0.8667268753051758, 1.5596091747283936, 2.2524914741516113, 2.94537353515625, 3.638256072998047, 4.3311381340026855, 5.024020195007324, 5.716902732849121, 6.40978479385376, 7.102666854858398, 7.795549392700195, 8.488431930541992, 9.181314468383789, 9.87419605255127, 10.567078590393066, 11.259960174560547, 11.952842712402344, 12.64572525024414, 13.338607788085938, 14.031489372253418, 14.724371910095215, 15.417253494262695, 16.110136032104492, 16.80301856994629, 17.495899200439453, 18.18878173828125, 18.881664276123047, 19.574546813964844, 20.26742935180664, 20.960311889648438]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 9.0, 8.0, 19.0, 25.0, 32.0, 87.0, 149.0, 323.0, 654.0, 1748.0, 4499.0, 14422.0, 55931.0, 394783.0, 3534513.0, 144071.0, 29701.0, 8430.0, 2874.0, 1070.0, 471.0, 186.0, 87.0, 56.0, 28.0, 26.0, 24.0, 11.0, 13.0, 10.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90234375, -3.69989013671875, -3.4974365234375, -3.29498291015625, -3.092529296875, -2.89007568359375, -2.6876220703125, -2.48516845703125, -2.28271484375, -2.08026123046875, -1.8778076171875, -1.67535400390625, -1.472900390625, -1.27044677734375, -1.0679931640625, -0.86553955078125, -0.6630859375, -0.46063232421875, -0.2581787109375, -0.05572509765625, 0.146728515625, 0.34918212890625, 0.5516357421875, 0.75408935546875, 0.95654296875, 1.15899658203125, 1.3614501953125, 1.56390380859375, 1.766357421875, 1.96881103515625, 2.1712646484375, 2.37371826171875, 2.576171875, 2.77862548828125, 2.9810791015625, 3.18353271484375, 3.385986328125, 3.58843994140625, 3.7908935546875, 3.99334716796875, 4.19580078125, 4.39825439453125, 4.6007080078125, 4.80316162109375, 5.005615234375, 5.20806884765625, 5.4105224609375, 5.61297607421875, 5.8154296875, 6.01788330078125, 6.2203369140625, 6.42279052734375, 6.625244140625, 6.82769775390625, 7.0301513671875, 7.23260498046875, 7.43505859375, 7.63751220703125, 7.8399658203125, 8.04241943359375, 8.244873046875, 8.44732666015625, 8.6497802734375, 8.85223388671875, 9.0546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 5.0, 3.0, 10.0, 7.0, 12.0, 13.0, 12.0, 27.0, 25.0, 24.0, 29.0, 43.0, 51.0, 47.0, 59.0, 44.0, 51.0, 62.0, 51.0, 53.0, 45.0, 48.0, 38.0, 36.0, 30.0, 31.0, 26.0, 24.0, 19.0, 15.0, 16.0, 11.0, 11.0, 7.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.61865234375, -0.6025772094726562, -0.5865020751953125, -0.5704269409179688, -0.554351806640625, -0.5382766723632812, -0.5222015380859375, -0.5061264038085938, -0.49005126953125, -0.47397613525390625, -0.4579010009765625, -0.44182586669921875, -0.425750732421875, -0.40967559814453125, -0.3936004638671875, -0.37752532958984375, -0.3614501953125, -0.34537506103515625, -0.3292999267578125, -0.31322479248046875, -0.297149658203125, -0.28107452392578125, -0.2649993896484375, -0.24892425537109375, -0.23284912109375, -0.21677398681640625, -0.2006988525390625, -0.18462371826171875, -0.168548583984375, -0.15247344970703125, -0.1363983154296875, -0.12032318115234375, -0.104248046875, -0.08817291259765625, -0.0720977783203125, -0.05602264404296875, -0.039947509765625, -0.02387237548828125, -0.0077972412109375, 0.00827789306640625, 0.02435302734375, 0.04042816162109375, 0.0565032958984375, 0.07257843017578125, 0.088653564453125, 0.10472869873046875, 0.1208038330078125, 0.13687896728515625, 0.1529541015625, 0.16902923583984375, 0.1851043701171875, 0.20117950439453125, 0.217254638671875, 0.23332977294921875, 0.2494049072265625, 0.26548004150390625, 0.28155517578125, 0.29763031005859375, 0.3137054443359375, 0.32978057861328125, 0.345855712890625, 0.36193084716796875, 0.3780059814453125, 0.39408111572265625, 0.41015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 1.0, 6.0, 13.0, 18.0, 29.0, 45.0, 41.0, 97.0, 405.0, 4034.0, 109602.0, 4007787.0, 68621.0, 2943.0, 322.0, 102.0, 47.0, 47.0, 37.0, 32.0, 25.0, 9.0, 12.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-25.25, -24.706298828125, -24.16259765625, -23.618896484375, -23.0751953125, -22.531494140625, -21.98779296875, -21.444091796875, -20.900390625, -20.356689453125, -19.81298828125, -19.269287109375, -18.7255859375, -18.181884765625, -17.63818359375, -17.094482421875, -16.55078125, -16.007080078125, -15.46337890625, -14.919677734375, -14.3759765625, -13.832275390625, -13.28857421875, -12.744873046875, -12.201171875, -11.657470703125, -11.11376953125, -10.570068359375, -10.0263671875, -9.482666015625, -8.93896484375, -8.395263671875, -7.8515625, -7.307861328125, -6.76416015625, -6.220458984375, -5.6767578125, -5.133056640625, -4.58935546875, -4.045654296875, -3.501953125, -2.958251953125, -2.41455078125, -1.870849609375, -1.3271484375, -0.783447265625, -0.23974609375, 0.303955078125, 0.84765625, 1.391357421875, 1.93505859375, 2.478759765625, 3.0224609375, 3.566162109375, 4.10986328125, 4.653564453125, 5.197265625, 5.740966796875, 6.28466796875, 6.828369140625, 7.3720703125, 7.915771484375, 8.45947265625, 9.003173828125, 9.546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 12.0, 18.0, 25.0, 44.0, 74.0, 153.0, 282.0, 821.0, 1844.0, 376.0, 179.0, 89.0, 63.0, 38.0, 21.0, 15.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98779296875, -0.9227981567382812, -0.8578033447265625, -0.7928085327148438, -0.727813720703125, -0.6628189086914062, -0.5978240966796875, -0.5328292846679688, -0.46783447265625, -0.40283966064453125, -0.3378448486328125, -0.27285003662109375, -0.207855224609375, -0.14286041259765625, -0.0778656005859375, -0.01287078857421875, 0.0521240234375, 0.11711883544921875, 0.1821136474609375, 0.24710845947265625, 0.312103271484375, 0.37709808349609375, 0.4420928955078125, 0.5070877075195312, 0.57208251953125, 0.6370773315429688, 0.7020721435546875, 0.7670669555664062, 0.832061767578125, 0.8970565795898438, 0.9620513916015625, 1.0270462036132812, 1.092041015625, 1.1570358276367188, 1.2220306396484375, 1.2870254516601562, 1.352020263671875, 1.4170150756835938, 1.4820098876953125, 1.5470046997070312, 1.61199951171875, 1.6769943237304688, 1.7419891357421875, 1.8069839477539062, 1.871978759765625, 1.9369735717773438, 2.0019683837890625, 2.0669631958007812, 2.1319580078125, 2.1969528198242188, 2.2619476318359375, 2.3269424438476562, 2.391937255859375, 2.4569320678710938, 2.5219268798828125, 2.5869216918945312, 2.65191650390625, 2.7169113159179688, 2.7819061279296875, 2.8469009399414062, 2.911895751953125, 2.9768905639648438, 3.0418853759765625, 3.1068801879882812, 3.171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 12.0, 14.0, 30.0, 76.0, 91.0, 157.0, 161.0, 185.0, 110.0, 70.0, 36.0, 29.0, 16.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.15162181854248, -11.768546104431152, -11.385470390319824, -11.002394676208496, -10.619318962097168, -10.23624324798584, -9.853168487548828, -9.4700927734375, -9.087017059326172, -8.703941345214844, -8.320865631103516, -7.9377899169921875, -7.554714202880859, -7.171638488769531, -6.788563251495361, -6.405487537384033, -6.022411346435547, -5.639335632324219, -5.256259918212891, -4.8731842041015625, -4.490108489990234, -4.107032775878906, -3.7239575386047363, -3.340881824493408, -2.95780611038208, -2.574730396270752, -2.191654682159424, -1.8085792064666748, -1.4255034923553467, -1.0424277782440186, -0.6593523025512695, -0.2762765884399414, 0.10680007934570312, 0.4898757338523865, 0.8729513883590698, 1.2560269832611084, 1.6391026973724365, 2.0221784114837646, 2.4052538871765137, 2.788329601287842, 3.17140531539917, 3.554481029510498, 3.937556743621826, 4.320631980895996, 4.703707695007324, 5.086783409118652, 5.4698591232299805, 5.852934837341309, 6.236010551452637, 6.619086265563965, 7.002161979675293, 7.385237693786621, 7.768313407897949, 8.151389122009277, 8.534463882446289, 8.917539596557617, 9.300615310668945, 9.683691024780273, 10.066766738891602, 10.44984245300293, 10.832918167114258, 11.215993881225586, 11.599069595336914, 11.982145309448242, 12.36522102355957]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 3.0, 10.0, 9.0, 10.0, 14.0, 18.0, 15.0, 14.0, 19.0, 21.0, 27.0, 29.0, 34.0, 30.0, 31.0, 41.0, 46.0, 39.0, 36.0, 49.0, 38.0, 52.0, 36.0, 37.0, 29.0, 36.0, 35.0, 30.0, 33.0, 31.0, 22.0, 21.0, 15.0, 11.0, 17.0, 8.0, 5.0, 6.0, 5.0, 6.0, 2.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.8206100463867188, -3.696869134902954, -3.5731284618377686, -3.449387550354004, -3.3256466388702393, -3.2019057273864746, -3.078165054321289, -2.9544241428375244, -2.8306832313537598, -2.706942319869995, -2.5832016468048096, -2.459460735321045, -2.3357198238372803, -2.2119789123535156, -2.08823823928833, -1.9644973278045654, -1.8407566547393799, -1.7170158624649048, -1.5932749509811401, -1.469534158706665, -1.3457932472229004, -1.2220524549484253, -1.0983116626739502, -0.9745708107948303, -0.8508299589157104, -0.7270891070365906, -0.6033482551574707, -0.4796074628829956, -0.35586661100387573, -0.23212575912475586, -0.10838496685028076, 0.015355885028839111, 0.13909673690795898, 0.26283758878707886, 0.38657841086387634, 0.5103192329406738, 0.6340600848197937, 0.7578009366989136, 0.8815417289733887, 1.0052826404571533, 1.1290234327316284, 1.2527642250061035, 1.3765051364898682, 1.5002459287643433, 1.6239867210388184, 1.747727632522583, 1.871468424797058, 1.9952092170715332, 2.118950128555298, 2.2426910400390625, 2.366431713104248, 2.4901726245880127, 2.6139135360717773, 2.737654209136963, 2.8613951206207275, 2.985136032104492, 3.1088767051696777, 3.2326176166534424, 3.356358289718628, 3.4800992012023926, 3.6038401126861572, 3.727581024169922, 3.8513216972351074, 3.975062608718872, 4.098803520202637]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 4.0, 5.0, 6.0, 9.0, 7.0, 18.0, 29.0, 49.0, 65.0, 126.0, 185.0, 354.0, 585.0, 1090.0, 2266.0, 4312.0, 8603.0, 18058.0, 37500.0, 80196.0, 163433.0, 274684.0, 227784.0, 119114.0, 57057.0, 27206.0, 12835.0, 6243.0, 3184.0, 1570.0, 794.0, 499.0, 236.0, 147.0, 94.0, 64.0, 38.0, 30.0, 28.0, 7.0, 11.0, 9.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.81640625, -2.73541259765625, -2.6544189453125, -2.57342529296875, -2.492431640625, -2.41143798828125, -2.3304443359375, -2.24945068359375, -2.16845703125, -2.08746337890625, -2.0064697265625, -1.92547607421875, -1.844482421875, -1.76348876953125, -1.6824951171875, -1.60150146484375, -1.5205078125, -1.43951416015625, -1.3585205078125, -1.27752685546875, -1.196533203125, -1.11553955078125, -1.0345458984375, -0.95355224609375, -0.87255859375, -0.79156494140625, -0.7105712890625, -0.62957763671875, -0.548583984375, -0.46759033203125, -0.3865966796875, -0.30560302734375, -0.224609375, -0.14361572265625, -0.0626220703125, 0.01837158203125, 0.099365234375, 0.18035888671875, 0.2613525390625, 0.34234619140625, 0.42333984375, 0.50433349609375, 0.5853271484375, 0.66632080078125, 0.747314453125, 0.82830810546875, 0.9093017578125, 0.99029541015625, 1.0712890625, 1.15228271484375, 1.2332763671875, 1.31427001953125, 1.395263671875, 1.47625732421875, 1.5572509765625, 1.63824462890625, 1.71923828125, 1.80023193359375, 1.8812255859375, 1.96221923828125, 2.043212890625, 2.12420654296875, 2.2052001953125, 2.28619384765625, 2.3671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 16.0, 15.0, 17.0, 22.0, 23.0, 23.0, 28.0, 41.0, 40.0, 45.0, 31.0, 45.0, 62.0, 52.0, 61.0, 61.0, 50.0, 49.0, 45.0, 43.0, 34.0, 31.0, 34.0, 17.0, 26.0, 10.0, 11.0, 11.0, 8.0, 11.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65673828125, -0.6398544311523438, -0.6229705810546875, -0.6060867309570312, -0.589202880859375, -0.5723190307617188, -0.5554351806640625, -0.5385513305664062, -0.52166748046875, -0.5047836303710938, -0.4878997802734375, -0.47101593017578125, -0.454132080078125, -0.43724822998046875, -0.4203643798828125, -0.40348052978515625, -0.3865966796875, -0.36971282958984375, -0.3528289794921875, -0.33594512939453125, -0.319061279296875, -0.30217742919921875, -0.2852935791015625, -0.26840972900390625, -0.25152587890625, -0.23464202880859375, -0.2177581787109375, -0.20087432861328125, -0.183990478515625, -0.16710662841796875, -0.1502227783203125, -0.13333892822265625, -0.116455078125, -0.09957122802734375, -0.0826873779296875, -0.06580352783203125, -0.048919677734375, -0.03203582763671875, -0.0151519775390625, 0.00173187255859375, 0.01861572265625, 0.03549957275390625, 0.0523834228515625, 0.06926727294921875, 0.086151123046875, 0.10303497314453125, 0.1199188232421875, 0.13680267333984375, 0.1536865234375, 0.17057037353515625, 0.1874542236328125, 0.20433807373046875, 0.221221923828125, 0.23810577392578125, 0.2549896240234375, 0.27187347412109375, 0.28875732421875, 0.30564117431640625, 0.3225250244140625, 0.33940887451171875, 0.356292724609375, 0.37317657470703125, 0.3900604248046875, 0.40694427490234375, 0.423828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 6.0, 8.0, 13.0, 19.0, 30.0, 54.0, 54.0, 89.0, 136.0, 223.0, 369.0, 686.0, 1320.0, 3029.0, 8625.0, 27729.0, 94992.0, 284659.0, 391766.0, 162311.0, 49041.0, 14392.0, 4877.0, 1899.0, 890.0, 495.0, 303.0, 162.0, 109.0, 95.0, 43.0, 33.0, 25.0, 17.0, 14.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.2578125, -4.140289306640625, -4.02276611328125, -3.905242919921875, -3.7877197265625, -3.670196533203125, -3.55267333984375, -3.435150146484375, -3.317626953125, -3.200103759765625, -3.08258056640625, -2.965057373046875, -2.8475341796875, -2.730010986328125, -2.61248779296875, -2.494964599609375, -2.37744140625, -2.259918212890625, -2.14239501953125, -2.024871826171875, -1.9073486328125, -1.789825439453125, -1.67230224609375, -1.554779052734375, -1.437255859375, -1.319732666015625, -1.20220947265625, -1.084686279296875, -0.9671630859375, -0.849639892578125, -0.73211669921875, -0.614593505859375, -0.4970703125, -0.379547119140625, -0.26202392578125, -0.144500732421875, -0.0269775390625, 0.090545654296875, 0.20806884765625, 0.325592041015625, 0.443115234375, 0.560638427734375, 0.67816162109375, 0.795684814453125, 0.9132080078125, 1.030731201171875, 1.14825439453125, 1.265777587890625, 1.38330078125, 1.500823974609375, 1.61834716796875, 1.735870361328125, 1.8533935546875, 1.970916748046875, 2.08843994140625, 2.205963134765625, 2.323486328125, 2.441009521484375, 2.55853271484375, 2.676055908203125, 2.7935791015625, 2.911102294921875, 3.02862548828125, 3.146148681640625, 3.263671875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 8.0, 7.0, 5.0, 17.0, 12.0, 26.0, 13.0, 29.0, 34.0, 34.0, 37.0, 40.0, 28.0, 41.0, 41.0, 56.0, 56.0, 42.0, 45.0, 43.0, 49.0, 43.0, 36.0, 40.0, 34.0, 30.0, 30.0, 23.0, 18.0, 20.0, 11.0, 12.0, 10.0, 10.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.307220458984375, -2.22772216796875, -2.148223876953125, -2.0687255859375, -1.989227294921875, -1.90972900390625, -1.830230712890625, -1.750732421875, -1.671234130859375, -1.59173583984375, -1.512237548828125, -1.4327392578125, -1.353240966796875, -1.27374267578125, -1.194244384765625, -1.11474609375, -1.035247802734375, -0.95574951171875, -0.876251220703125, -0.7967529296875, -0.717254638671875, -0.63775634765625, -0.558258056640625, -0.478759765625, -0.399261474609375, -0.31976318359375, -0.240264892578125, -0.1607666015625, -0.081268310546875, -0.00177001953125, 0.077728271484375, 0.1572265625, 0.236724853515625, 0.31622314453125, 0.395721435546875, 0.4752197265625, 0.554718017578125, 0.63421630859375, 0.713714599609375, 0.793212890625, 0.872711181640625, 0.95220947265625, 1.031707763671875, 1.1112060546875, 1.190704345703125, 1.27020263671875, 1.349700927734375, 1.42919921875, 1.508697509765625, 1.58819580078125, 1.667694091796875, 1.7471923828125, 1.826690673828125, 1.90618896484375, 1.985687255859375, 2.065185546875, 2.144683837890625, 2.22418212890625, 2.303680419921875, 2.3831787109375, 2.462677001953125, 2.54217529296875, 2.621673583984375, 2.701171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 8.0, 11.0, 11.0, 13.0, 30.0, 25.0, 36.0, 58.0, 89.0, 157.0, 338.0, 646.0, 1666.0, 5108.0, 21961.0, 156558.0, 680565.0, 151752.0, 21382.0, 5039.0, 1661.0, 674.0, 311.0, 147.0, 103.0, 56.0, 45.0, 27.0, 13.0, 12.0, 10.0, 10.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.634246826171875, -3.52239990234375, -3.410552978515625, -3.2987060546875, -3.186859130859375, -3.07501220703125, -2.963165283203125, -2.851318359375, -2.739471435546875, -2.62762451171875, -2.515777587890625, -2.4039306640625, -2.292083740234375, -2.18023681640625, -2.068389892578125, -1.95654296875, -1.844696044921875, -1.73284912109375, -1.621002197265625, -1.5091552734375, -1.397308349609375, -1.28546142578125, -1.173614501953125, -1.061767578125, -0.949920654296875, -0.83807373046875, -0.726226806640625, -0.6143798828125, -0.502532958984375, -0.39068603515625, -0.278839111328125, -0.1669921875, -0.055145263671875, 0.05670166015625, 0.168548583984375, 0.2803955078125, 0.392242431640625, 0.50408935546875, 0.615936279296875, 0.727783203125, 0.839630126953125, 0.95147705078125, 1.063323974609375, 1.1751708984375, 1.287017822265625, 1.39886474609375, 1.510711669921875, 1.62255859375, 1.734405517578125, 1.84625244140625, 1.958099365234375, 2.0699462890625, 2.181793212890625, 2.29364013671875, 2.405487060546875, 2.517333984375, 2.629180908203125, 2.74102783203125, 2.852874755859375, 2.9647216796875, 3.076568603515625, 3.18841552734375, 3.300262451171875, 3.412109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 1.0, 7.0, 6.0, 7.0, 9.0, 13.0, 7.0, 21.0, 25.0, 32.0, 37.0, 66.0, 107.0, 132.0, 140.0, 117.0, 82.0, 43.0, 41.0, 33.0, 18.0, 16.0, 14.0, 10.0, 6.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0006384849548339844, -0.0006229914724826813, -0.0006074979901313782, -0.0005920045077800751, -0.000576511025428772, -0.0005610175430774689, -0.0005455240607261658, -0.0005300305783748627, -0.0005145370960235596, -0.0004990436136722565, -0.00048355013132095337, -0.00046805664896965027, -0.00045256316661834717, -0.00043706968426704407, -0.00042157620191574097, -0.00040608271956443787, -0.00039058923721313477, -0.00037509575486183167, -0.00035960227251052856, -0.00034410879015922546, -0.00032861530780792236, -0.00031312182545661926, -0.00029762834310531616, -0.00028213486075401306, -0.00026664137840270996, -0.00025114789605140686, -0.00023565441370010376, -0.00022016093134880066, -0.00020466744899749756, -0.00018917396664619446, -0.00017368048429489136, -0.00015818700194358826, -0.00014269351959228516, -0.00012720003724098206, -0.00011170655488967896, -9.621307253837585e-05, -8.071959018707275e-05, -6.522610783576965e-05, -4.973262548446655e-05, -3.423914313316345e-05, -1.874566078186035e-05, -3.252178430557251e-06, 1.224130392074585e-05, 2.773478627204895e-05, 4.322826862335205e-05, 5.872175097465515e-05, 7.421523332595825e-05, 8.970871567726135e-05, 0.00010520219802856445, 0.00012069568037986755, 0.00013618916273117065, 0.00015168264508247375, 0.00016717612743377686, 0.00018266960978507996, 0.00019816309213638306, 0.00021365657448768616, 0.00022915005683898926, 0.00024464353919029236, 0.00026013702154159546, 0.00027563050389289856, 0.00029112398624420166, 0.00030661746859550476, 0.00032211095094680786, 0.00033760443329811096, 0.00035309791564941406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 9.0, 12.0, 13.0, 17.0, 22.0, 32.0, 52.0, 67.0, 97.0, 205.0, 308.0, 577.0, 1097.0, 2271.0, 5475.0, 16412.0, 61106.0, 327984.0, 497635.0, 97817.0, 23773.0, 7597.0, 2989.0, 1357.0, 637.0, 361.0, 210.0, 146.0, 72.0, 44.0, 29.0, 32.0, 13.0, 18.0, 9.0, 14.0, 3.0, 7.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-3.08984375, -2.99664306640625, -2.9034423828125, -2.81024169921875, -2.717041015625, -2.62384033203125, -2.5306396484375, -2.43743896484375, -2.34423828125, -2.25103759765625, -2.1578369140625, -2.06463623046875, -1.971435546875, -1.87823486328125, -1.7850341796875, -1.69183349609375, -1.5986328125, -1.50543212890625, -1.4122314453125, -1.31903076171875, -1.225830078125, -1.13262939453125, -1.0394287109375, -0.94622802734375, -0.85302734375, -0.75982666015625, -0.6666259765625, -0.57342529296875, -0.480224609375, -0.38702392578125, -0.2938232421875, -0.20062255859375, -0.107421875, -0.01422119140625, 0.0789794921875, 0.17218017578125, 0.265380859375, 0.35858154296875, 0.4517822265625, 0.54498291015625, 0.63818359375, 0.73138427734375, 0.8245849609375, 0.91778564453125, 1.010986328125, 1.10418701171875, 1.1973876953125, 1.29058837890625, 1.3837890625, 1.47698974609375, 1.5701904296875, 1.66339111328125, 1.756591796875, 1.84979248046875, 1.9429931640625, 2.03619384765625, 2.12939453125, 2.22259521484375, 2.3157958984375, 2.40899658203125, 2.502197265625, 2.59539794921875, 2.6885986328125, 2.78179931640625, 2.875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 11.0, 8.0, 10.0, 10.0, 22.0, 20.0, 25.0, 35.0, 45.0, 50.0, 57.0, 77.0, 74.0, 84.0, 83.0, 81.0, 61.0, 51.0, 35.0, 29.0, 27.0, 21.0, 12.0, 11.0, 11.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.13671875, -1.09326171875, -1.0498046875, -1.00634765625, -0.962890625, -0.91943359375, -0.8759765625, -0.83251953125, -0.7890625, -0.74560546875, -0.7021484375, -0.65869140625, -0.615234375, -0.57177734375, -0.5283203125, -0.48486328125, -0.44140625, -0.39794921875, -0.3544921875, -0.31103515625, -0.267578125, -0.22412109375, -0.1806640625, -0.13720703125, -0.09375, -0.05029296875, -0.0068359375, 0.03662109375, 0.080078125, 0.12353515625, 0.1669921875, 0.21044921875, 0.25390625, 0.29736328125, 0.3408203125, 0.38427734375, 0.427734375, 0.47119140625, 0.5146484375, 0.55810546875, 0.6015625, 0.64501953125, 0.6884765625, 0.73193359375, 0.775390625, 0.81884765625, 0.8623046875, 0.90576171875, 0.94921875, 0.99267578125, 1.0361328125, 1.07958984375, 1.123046875, 1.16650390625, 1.2099609375, 1.25341796875, 1.296875, 1.34033203125, 1.3837890625, 1.42724609375, 1.470703125, 1.51416015625, 1.5576171875, 1.60107421875, 1.64453125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 20.0, 45.0, 64.0, 105.0, 161.0, 208.0, 166.0, 98.0, 57.0, 40.0, 14.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.03725814819336, -35.86587905883789, -34.69449996948242, -33.52312088012695, -32.351741790771484, -31.180362701416016, -30.008983612060547, -28.837604522705078, -27.66622543334961, -26.49484634399414, -25.323467254638672, -24.152088165283203, -22.980709075927734, -21.809329986572266, -20.637950897216797, -19.466571807861328, -18.29519271850586, -17.12381362915039, -15.952434539794922, -14.781055450439453, -13.609676361083984, -12.438297271728516, -11.266918182373047, -10.095539093017578, -8.92416000366211, -7.752780914306641, -6.581401824951172, -5.410022735595703, -4.238643646240234, -3.0672645568847656, -1.8958854675292969, -0.7245063781738281, 0.4468727111816406, 1.6182518005371094, 2.789630889892578, 3.961009979248047, 5.132389068603516, 6.303768157958984, 7.475147247314453, 8.646526336669922, 9.81790542602539, 10.98928451538086, 12.160663604736328, 13.332042694091797, 14.503421783447266, 15.674800872802734, 16.846179962158203, 18.017559051513672, 19.18893814086914, 20.36031723022461, 21.531696319580078, 22.703075408935547, 23.874454498291016, 25.045833587646484, 26.217212677001953, 27.388591766357422, 28.55997085571289, 29.73134994506836, 30.902729034423828, 32.0741081237793, 33.245487213134766, 34.416866302490234, 35.5882453918457, 36.75962448120117, 37.93100357055664]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 6.0, 12.0, 9.0, 21.0, 20.0, 27.0, 29.0, 29.0, 40.0, 45.0, 44.0, 49.0, 52.0, 46.0, 57.0, 37.0, 55.0, 54.0, 35.0, 51.0, 42.0, 39.0, 40.0, 25.0, 25.0, 28.0, 9.0, 15.0, 16.0, 9.0, 5.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.891378402709961, -12.398017883300781, -11.904656410217285, -11.411295890808105, -10.917935371398926, -10.42457389831543, -9.93121337890625, -9.43785285949707, -8.94449234008789, -8.451131820678711, -7.957770824432373, -7.464409828186035, -6.9710493087768555, -6.477688312530518, -5.98432731628418, -5.490966796875, -4.997605800628662, -4.504244804382324, -4.0108842849731445, -3.5175232887268066, -3.024162769317627, -2.530801773071289, -2.0374410152435303, -1.5440802574157715, -1.0507194995880127, -0.5573587417602539, -0.06399792432785034, 0.4293628931045532, 0.922723650932312, 1.4160845279693604, 1.9094452857971191, 2.402806043624878, 2.8961668014526367, 3.3895275592803955, 3.8828883171081543, 4.376249313354492, 4.869609832763672, 5.36297082901001, 5.856331825256348, 6.349692344665527, 6.843052864074707, 7.336413860321045, 7.829774379730225, 8.323135375976562, 8.816495895385742, 9.309856414794922, 9.803217887878418, 10.296578407287598, 10.789939880371094, 11.283300399780273, 11.77666187286377, 12.27002239227295, 12.763382911682129, 13.256744384765625, 13.750104904174805, 14.243465423583984, 14.736825942993164, 15.230186462402344, 15.72354793548584, 16.216907501220703, 16.710269927978516, 17.203630447387695, 17.696990966796875, 18.190351486206055, 18.683712005615234]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 12.0, 22.0, 17.0, 32.0, 50.0, 67.0, 99.0, 198.0, 302.0, 532.0, 1059.0, 2155.0, 4679.0, 10355.0, 25797.0, 85425.0, 812958.0, 3089362.0, 108927.0, 30948.0, 11634.0, 4903.0, 2301.0, 1105.0, 529.0, 331.0, 157.0, 94.0, 82.0, 53.0, 25.0, 17.0, 12.0, 10.0, 10.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.103515625, -2.974639892578125, -2.84576416015625, -2.716888427734375, -2.5880126953125, -2.459136962890625, -2.33026123046875, -2.201385498046875, -2.072509765625, -1.943634033203125, -1.81475830078125, -1.685882568359375, -1.5570068359375, -1.428131103515625, -1.29925537109375, -1.170379638671875, -1.04150390625, -0.912628173828125, -0.78375244140625, -0.654876708984375, -0.5260009765625, -0.397125244140625, -0.26824951171875, -0.139373779296875, -0.010498046875, 0.118377685546875, 0.24725341796875, 0.376129150390625, 0.5050048828125, 0.633880615234375, 0.76275634765625, 0.891632080078125, 1.0205078125, 1.149383544921875, 1.27825927734375, 1.407135009765625, 1.5360107421875, 1.664886474609375, 1.79376220703125, 1.922637939453125, 2.051513671875, 2.180389404296875, 2.30926513671875, 2.438140869140625, 2.5670166015625, 2.695892333984375, 2.82476806640625, 2.953643798828125, 3.08251953125, 3.211395263671875, 3.34027099609375, 3.469146728515625, 3.5980224609375, 3.726898193359375, 3.85577392578125, 3.984649658203125, 4.113525390625, 4.242401123046875, 4.37127685546875, 4.500152587890625, 4.6290283203125, 4.757904052734375, 4.88677978515625, 5.015655517578125, 5.14453125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 10.0, 15.0, 13.0, 19.0, 13.0, 23.0, 39.0, 32.0, 39.0, 47.0, 48.0, 54.0, 84.0, 51.0, 64.0, 74.0, 68.0, 54.0, 55.0, 41.0, 33.0, 29.0, 24.0, 15.0, 19.0, 13.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7667236328125, -0.745849609375, -0.7249755859375, -0.7041015625, -0.6832275390625, -0.662353515625, -0.6414794921875, -0.62060546875, -0.5997314453125, -0.578857421875, -0.5579833984375, -0.537109375, -0.5162353515625, -0.495361328125, -0.4744873046875, -0.45361328125, -0.4327392578125, -0.411865234375, -0.3909912109375, -0.3701171875, -0.3492431640625, -0.328369140625, -0.3074951171875, -0.28662109375, -0.2657470703125, -0.244873046875, -0.2239990234375, -0.203125, -0.1822509765625, -0.161376953125, -0.1405029296875, -0.11962890625, -0.0987548828125, -0.077880859375, -0.0570068359375, -0.0361328125, -0.0152587890625, 0.005615234375, 0.0264892578125, 0.04736328125, 0.0682373046875, 0.089111328125, 0.1099853515625, 0.130859375, 0.1517333984375, 0.172607421875, 0.1934814453125, 0.21435546875, 0.2352294921875, 0.256103515625, 0.2769775390625, 0.2978515625, 0.3187255859375, 0.339599609375, 0.3604736328125, 0.38134765625, 0.4022216796875, 0.423095703125, 0.4439697265625, 0.46484375, 0.4857177734375, 0.506591796875, 0.5274658203125, 0.54833984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 11.0, 23.0, 26.0, 50.0, 98.0, 168.0, 332.0, 625.0, 1199.0, 2334.0, 5239.0, 12961.0, 37387.0, 126884.0, 878239.0, 2861244.0, 188233.0, 49607.0, 16954.0, 6616.0, 3084.0, 1442.0, 733.0, 382.0, 187.0, 113.0, 42.0, 28.0, 18.0, 9.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.06640625, -4.9461669921875, -4.825927734375, -4.7056884765625, -4.58544921875, -4.4652099609375, -4.344970703125, -4.2247314453125, -4.1044921875, -3.9842529296875, -3.864013671875, -3.7437744140625, -3.62353515625, -3.5032958984375, -3.383056640625, -3.2628173828125, -3.142578125, -3.0223388671875, -2.902099609375, -2.7818603515625, -2.66162109375, -2.5413818359375, -2.421142578125, -2.3009033203125, -2.1806640625, -2.0604248046875, -1.940185546875, -1.8199462890625, -1.69970703125, -1.5794677734375, -1.459228515625, -1.3389892578125, -1.21875, -1.0985107421875, -0.978271484375, -0.8580322265625, -0.73779296875, -0.6175537109375, -0.497314453125, -0.3770751953125, -0.2568359375, -0.1365966796875, -0.016357421875, 0.1038818359375, 0.22412109375, 0.3443603515625, 0.464599609375, 0.5848388671875, 0.705078125, 0.8253173828125, 0.945556640625, 1.0657958984375, 1.18603515625, 1.3062744140625, 1.426513671875, 1.5467529296875, 1.6669921875, 1.7872314453125, 1.907470703125, 2.0277099609375, 2.14794921875, 2.2681884765625, 2.388427734375, 2.5086669921875, 2.62890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 15.0, 17.0, 10.0, 13.0, 22.0, 33.0, 51.0, 66.0, 80.0, 111.0, 174.0, 282.0, 776.0, 1363.0, 393.0, 179.0, 109.0, 87.0, 55.0, 53.0, 38.0, 27.0, 27.0, 8.0, 11.0, 8.0, 9.0, 7.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.8346633911132812, -0.8060455322265625, -0.7774276733398438, -0.748809814453125, -0.7201919555664062, -0.6915740966796875, -0.6629562377929688, -0.63433837890625, -0.6057205200195312, -0.5771026611328125, -0.5484848022460938, -0.519866943359375, -0.49124908447265625, -0.4626312255859375, -0.43401336669921875, -0.4053955078125, -0.37677764892578125, -0.3481597900390625, -0.31954193115234375, -0.290924072265625, -0.26230621337890625, -0.2336883544921875, -0.20507049560546875, -0.17645263671875, -0.14783477783203125, -0.1192169189453125, -0.09059906005859375, -0.061981201171875, -0.03336334228515625, -0.0047454833984375, 0.02387237548828125, 0.052490234375, 0.08110809326171875, 0.1097259521484375, 0.13834381103515625, 0.166961669921875, 0.19557952880859375, 0.2241973876953125, 0.25281524658203125, 0.28143310546875, 0.31005096435546875, 0.3386688232421875, 0.36728668212890625, 0.395904541015625, 0.42452239990234375, 0.4531402587890625, 0.48175811767578125, 0.5103759765625, 0.5389938354492188, 0.5676116943359375, 0.5962295532226562, 0.624847412109375, 0.6534652709960938, 0.6820831298828125, 0.7107009887695312, 0.73931884765625, 0.7679367065429688, 0.7965545654296875, 0.8251724243164062, 0.853790283203125, 0.8824081420898438, 0.9110260009765625, 0.9396438598632812, 0.96826171875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 14.0, 26.0, 52.0, 78.0, 135.0, 149.0, 160.0, 128.0, 99.0, 65.0, 37.0, 22.0, 12.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.186822891235352, -7.87867546081543, -7.570528030395508, -7.262380599975586, -6.954233169555664, -6.646085739135742, -6.337937831878662, -6.02979040145874, -5.721642971038818, -5.4134955406188965, -5.105348110198975, -4.797200679779053, -4.489052772521973, -4.180905342102051, -3.872757911682129, -3.564610481262207, -3.256463050842285, -2.9483156204223633, -2.6401681900024414, -2.3320205211639404, -2.0238730907440186, -1.7157256603240967, -1.4075781106948853, -1.0994305610656738, -0.791283130645752, -0.4831356406211853, -0.17498815059661865, 0.133159339427948, 0.44130682945251465, 0.7494542598724365, 1.057601809501648, 1.3657493591308594, 1.6738967895507812, 1.9820442199707031, 2.290191650390625, 2.598339319229126, 2.906486749649048, 3.2146341800689697, 3.5227818489074707, 3.8309292793273926, 4.1390767097473145, 4.447224140167236, 4.755371570587158, 5.06351900100708, 5.37166690826416, 5.679814338684082, 5.987961769104004, 6.296109199523926, 6.604256629943848, 6.9124040603637695, 7.220551490783691, 7.528698921203613, 7.836846351623535, 8.144993782043457, 8.453141212463379, 8.761289596557617, 9.069437026977539, 9.377584457397461, 9.685731887817383, 9.993879318237305, 10.302026748657227, 10.610174179077148, 10.91832160949707, 11.226469039916992, 11.534616470336914]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 2.0, 9.0, 10.0, 7.0, 10.0, 8.0, 3.0, 13.0, 11.0, 19.0, 29.0, 30.0, 28.0, 23.0, 34.0, 36.0, 31.0, 46.0, 25.0, 32.0, 48.0, 42.0, 44.0, 51.0, 31.0, 35.0, 42.0, 43.0, 29.0, 27.0, 33.0, 25.0, 26.0, 17.0, 11.0, 19.0, 24.0, 9.0, 5.0, 6.0, 7.0, 4.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.6991701126098633, -3.5904452800750732, -3.481720447540283, -3.3729958534240723, -3.2642710208892822, -3.155546188354492, -3.046821355819702, -2.938096523284912, -2.829371929168701, -2.720647096633911, -2.611922264099121, -2.50319766998291, -2.39447283744812, -2.28574800491333, -2.17702317237854, -2.06829833984375, -1.95957350730896, -1.85084867477417, -1.7421239614486694, -1.6333991289138794, -1.524674415588379, -1.4159495830535889, -1.3072247505187988, -1.1984999179840088, -1.0897752046585083, -0.981050431728363, -0.8723256587982178, -0.7636008262634277, -0.6548760533332825, -0.5461512804031372, -0.43742644786834717, -0.3287016749382019, -0.21997690200805664, -0.11125211417675018, -0.0025273263454437256, 0.10619747638702393, 0.2149222493171692, 0.32364702224731445, 0.4323718547821045, 0.5410966277122498, 0.649821400642395, 0.7585461735725403, 0.8672709465026855, 0.9759957790374756, 1.0847206115722656, 1.1934453248977661, 1.3021701574325562, 1.4108948707580566, 1.5196197032928467, 1.6283445358276367, 1.7370692491531372, 1.8457940816879272, 1.9545187950134277, 2.0632436275482178, 2.171968460083008, 2.280693292617798, 2.389418125152588, 2.498142957687378, 2.606867790222168, 2.715592384338379, 2.824317216873169, 2.933042049407959, 3.041766881942749, 3.150491714477539, 3.25921630859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 5.0, 24.0, 21.0, 32.0, 43.0, 86.0, 128.0, 220.0, 340.0, 616.0, 1068.0, 1967.0, 3835.0, 7385.0, 14819.0, 31087.0, 67393.0, 142360.0, 255440.0, 252381.0, 141291.0, 66698.0, 31198.0, 14684.0, 7258.0, 3614.0, 1983.0, 1065.0, 617.0, 341.0, 184.0, 129.0, 63.0, 48.0, 36.0, 29.0, 12.0, 12.0, 6.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.361724853515625, -2.28790283203125, -2.214080810546875, -2.1402587890625, -2.066436767578125, -1.99261474609375, -1.918792724609375, -1.844970703125, -1.771148681640625, -1.69732666015625, -1.623504638671875, -1.5496826171875, -1.475860595703125, -1.40203857421875, -1.328216552734375, -1.25439453125, -1.180572509765625, -1.10675048828125, -1.032928466796875, -0.9591064453125, -0.885284423828125, -0.81146240234375, -0.737640380859375, -0.663818359375, -0.589996337890625, -0.51617431640625, -0.442352294921875, -0.3685302734375, -0.294708251953125, -0.22088623046875, -0.147064208984375, -0.0732421875, 0.000579833984375, 0.07440185546875, 0.148223876953125, 0.2220458984375, 0.295867919921875, 0.36968994140625, 0.443511962890625, 0.517333984375, 0.591156005859375, 0.66497802734375, 0.738800048828125, 0.8126220703125, 0.886444091796875, 0.96026611328125, 1.034088134765625, 1.10791015625, 1.181732177734375, 1.25555419921875, 1.329376220703125, 1.4031982421875, 1.477020263671875, 1.55084228515625, 1.624664306640625, 1.698486328125, 1.772308349609375, 1.84613037109375, 1.919952392578125, 1.9937744140625, 2.067596435546875, 2.14141845703125, 2.215240478515625, 2.2890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 9.0, 7.0, 9.0, 16.0, 22.0, 24.0, 25.0, 41.0, 39.0, 46.0, 37.0, 52.0, 56.0, 63.0, 49.0, 57.0, 56.0, 78.0, 57.0, 52.0, 43.0, 33.0, 29.0, 21.0, 17.0, 16.0, 12.0, 9.0, 8.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76318359375, -0.7428054809570312, -0.7224273681640625, -0.7020492553710938, -0.681671142578125, -0.6612930297851562, -0.6409149169921875, -0.6205368041992188, -0.60015869140625, -0.5797805786132812, -0.5594024658203125, -0.5390243530273438, -0.518646240234375, -0.49826812744140625, -0.4778900146484375, -0.45751190185546875, -0.4371337890625, -0.41675567626953125, -0.3963775634765625, -0.37599945068359375, -0.355621337890625, -0.33524322509765625, -0.3148651123046875, -0.29448699951171875, -0.27410888671875, -0.25373077392578125, -0.2333526611328125, -0.21297454833984375, -0.192596435546875, -0.17221832275390625, -0.1518402099609375, -0.13146209716796875, -0.111083984375, -0.09070587158203125, -0.0703277587890625, -0.04994964599609375, -0.029571533203125, -0.00919342041015625, 0.0111846923828125, 0.03156280517578125, 0.05194091796875, 0.07231903076171875, 0.0926971435546875, 0.11307525634765625, 0.133453369140625, 0.15383148193359375, 0.1742095947265625, 0.19458770751953125, 0.2149658203125, 0.23534393310546875, 0.2557220458984375, 0.27610015869140625, 0.296478271484375, 0.31685638427734375, 0.3372344970703125, 0.35761260986328125, 0.37799072265625, 0.39836883544921875, 0.4187469482421875, 0.43912506103515625, 0.459503173828125, 0.47988128662109375, 0.5002593994140625, 0.5206375122070312, 0.541015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 13.0, 18.0, 17.0, 39.0, 38.0, 80.0, 140.0, 232.0, 439.0, 982.0, 2598.0, 9705.0, 51349.0, 296788.0, 528877.0, 128000.0, 21554.0, 4684.0, 1525.0, 682.0, 308.0, 190.0, 89.0, 66.0, 47.0, 20.0, 12.0, 9.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.97265625, -4.81353759765625, -4.6544189453125, -4.49530029296875, -4.336181640625, -4.17706298828125, -4.0179443359375, -3.85882568359375, -3.69970703125, -3.54058837890625, -3.3814697265625, -3.22235107421875, -3.063232421875, -2.90411376953125, -2.7449951171875, -2.58587646484375, -2.4267578125, -2.26763916015625, -2.1085205078125, -1.94940185546875, -1.790283203125, -1.63116455078125, -1.4720458984375, -1.31292724609375, -1.15380859375, -0.99468994140625, -0.8355712890625, -0.67645263671875, -0.517333984375, -0.35821533203125, -0.1990966796875, -0.03997802734375, 0.119140625, 0.27825927734375, 0.4373779296875, 0.59649658203125, 0.755615234375, 0.91473388671875, 1.0738525390625, 1.23297119140625, 1.39208984375, 1.55120849609375, 1.7103271484375, 1.86944580078125, 2.028564453125, 2.18768310546875, 2.3468017578125, 2.50592041015625, 2.6650390625, 2.82415771484375, 2.9832763671875, 3.14239501953125, 3.301513671875, 3.46063232421875, 3.6197509765625, 3.77886962890625, 3.93798828125, 4.09710693359375, 4.2562255859375, 4.41534423828125, 4.574462890625, 4.73358154296875, 4.8927001953125, 5.05181884765625, 5.2109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 13.0, 9.0, 17.0, 17.0, 21.0, 16.0, 19.0, 32.0, 32.0, 40.0, 42.0, 34.0, 47.0, 42.0, 45.0, 62.0, 48.0, 42.0, 41.0, 51.0, 52.0, 36.0, 39.0, 39.0, 27.0, 29.0, 26.0, 19.0, 15.0, 11.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.21624755859375, -2.1336669921875, -2.05108642578125, -1.968505859375, -1.88592529296875, -1.8033447265625, -1.72076416015625, -1.63818359375, -1.55560302734375, -1.4730224609375, -1.39044189453125, -1.307861328125, -1.22528076171875, -1.1427001953125, -1.06011962890625, -0.9775390625, -0.89495849609375, -0.8123779296875, -0.72979736328125, -0.647216796875, -0.56463623046875, -0.4820556640625, -0.39947509765625, -0.31689453125, -0.23431396484375, -0.1517333984375, -0.06915283203125, 0.013427734375, 0.09600830078125, 0.1785888671875, 0.26116943359375, 0.34375, 0.42633056640625, 0.5089111328125, 0.59149169921875, 0.674072265625, 0.75665283203125, 0.8392333984375, 0.92181396484375, 1.00439453125, 1.08697509765625, 1.1695556640625, 1.25213623046875, 1.334716796875, 1.41729736328125, 1.4998779296875, 1.58245849609375, 1.6650390625, 1.74761962890625, 1.8302001953125, 1.91278076171875, 1.995361328125, 2.07794189453125, 2.1605224609375, 2.24310302734375, 2.32568359375, 2.40826416015625, 2.4908447265625, 2.57342529296875, 2.656005859375, 2.73858642578125, 2.8211669921875, 2.90374755859375, 2.986328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 5.0, 1.0, 6.0, 6.0, 8.0, 7.0, 8.0, 18.0, 10.0, 16.0, 24.0, 35.0, 53.0, 92.0, 192.0, 397.0, 1074.0, 3365.0, 13175.0, 80883.0, 715523.0, 201928.0, 23544.0, 5443.0, 1608.0, 530.0, 242.0, 127.0, 75.0, 34.0, 27.0, 22.0, 15.0, 12.0, 9.0, 6.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.31640625, -4.19873046875, -4.0810546875, -3.96337890625, -3.845703125, -3.72802734375, -3.6103515625, -3.49267578125, -3.375, -3.25732421875, -3.1396484375, -3.02197265625, -2.904296875, -2.78662109375, -2.6689453125, -2.55126953125, -2.43359375, -2.31591796875, -2.1982421875, -2.08056640625, -1.962890625, -1.84521484375, -1.7275390625, -1.60986328125, -1.4921875, -1.37451171875, -1.2568359375, -1.13916015625, -1.021484375, -0.90380859375, -0.7861328125, -0.66845703125, -0.55078125, -0.43310546875, -0.3154296875, -0.19775390625, -0.080078125, 0.03759765625, 0.1552734375, 0.27294921875, 0.390625, 0.50830078125, 0.6259765625, 0.74365234375, 0.861328125, 0.97900390625, 1.0966796875, 1.21435546875, 1.33203125, 1.44970703125, 1.5673828125, 1.68505859375, 1.802734375, 1.92041015625, 2.0380859375, 2.15576171875, 2.2734375, 2.39111328125, 2.5087890625, 2.62646484375, 2.744140625, 2.86181640625, 2.9794921875, 3.09716796875, 3.21484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 4.0, 6.0, 6.0, 5.0, 14.0, 17.0, 12.0, 22.0, 25.0, 35.0, 59.0, 94.0, 95.0, 122.0, 116.0, 90.0, 70.0, 48.0, 26.0, 28.0, 25.0, 9.0, 11.0, 7.0, 6.0, 3.0, 6.0, 7.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.00040984153747558594, -0.0003980807960033417, -0.0003863200545310974, -0.00037455931305885315, -0.0003627985715866089, -0.0003510378301143646, -0.00033927708864212036, -0.0003275163471698761, -0.00031575560569763184, -0.0003039948642253876, -0.0002922341227531433, -0.00028047338128089905, -0.0002687126398086548, -0.0002569518983364105, -0.00024519115686416626, -0.000233430415391922, -0.00022166967391967773, -0.00020990893244743347, -0.0001981481909751892, -0.00018638744950294495, -0.00017462670803070068, -0.00016286596655845642, -0.00015110522508621216, -0.0001393444836139679, -0.00012758374214172363, -0.00011582300066947937, -0.00010406225919723511, -9.230151772499084e-05, -8.054077625274658e-05, -6.878003478050232e-05, -5.701929330825806e-05, -4.5258551836013794e-05, -3.349781036376953e-05, -2.173706889152527e-05, -9.976327419281006e-06, 1.7844140529632568e-06, 1.354515552520752e-05, 2.5305896997451782e-05, 3.7066638469696045e-05, 4.882737994194031e-05, 6.058812141418457e-05, 7.234886288642883e-05, 8.41096043586731e-05, 9.587034583091736e-05, 0.00010763108730316162, 0.00011939182877540588, 0.00013115257024765015, 0.0001429133117198944, 0.00015467405319213867, 0.00016643479466438293, 0.0001781955361366272, 0.00018995627760887146, 0.00020171701908111572, 0.00021347776055335999, 0.00022523850202560425, 0.0002369992434978485, 0.0002487599849700928, 0.00026052072644233704, 0.0002722814679145813, 0.00028404220938682556, 0.0002958029508590698, 0.0003075636923313141, 0.00031932443380355835, 0.0003310851752758026, 0.0003428459167480469]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 3.0, 6.0, 6.0, 10.0, 19.0, 25.0, 26.0, 66.0, 99.0, 194.0, 396.0, 868.0, 2197.0, 7764.0, 47864.0, 682931.0, 275026.0, 23454.0, 4724.0, 1538.0, 643.0, 292.0, 145.0, 87.0, 54.0, 34.0, 21.0, 15.0, 11.0, 11.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.56671142578125, -5.4068603515625, -5.24700927734375, -5.087158203125, -4.92730712890625, -4.7674560546875, -4.60760498046875, -4.44775390625, -4.28790283203125, -4.1280517578125, -3.96820068359375, -3.808349609375, -3.64849853515625, -3.4886474609375, -3.32879638671875, -3.1689453125, -3.00909423828125, -2.8492431640625, -2.68939208984375, -2.529541015625, -2.36968994140625, -2.2098388671875, -2.04998779296875, -1.89013671875, -1.73028564453125, -1.5704345703125, -1.41058349609375, -1.250732421875, -1.09088134765625, -0.9310302734375, -0.77117919921875, -0.611328125, -0.45147705078125, -0.2916259765625, -0.13177490234375, 0.028076171875, 0.18792724609375, 0.3477783203125, 0.50762939453125, 0.66748046875, 0.82733154296875, 0.9871826171875, 1.14703369140625, 1.306884765625, 1.46673583984375, 1.6265869140625, 1.78643798828125, 1.9462890625, 2.10614013671875, 2.2659912109375, 2.42584228515625, 2.585693359375, 2.74554443359375, 2.9053955078125, 3.06524658203125, 3.22509765625, 3.38494873046875, 3.5447998046875, 3.70465087890625, 3.864501953125, 4.02435302734375, 4.1842041015625, 4.34405517578125, 4.50390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 9.0, 12.0, 16.0, 20.0, 33.0, 74.0, 119.0, 199.0, 198.0, 137.0, 49.0, 47.0, 27.0, 19.0, 13.0, 8.0, 9.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.847320556640625, -3.73760986328125, -3.627899169921875, -3.5181884765625, -3.408477783203125, -3.29876708984375, -3.189056396484375, -3.079345703125, -2.969635009765625, -2.85992431640625, -2.750213623046875, -2.6405029296875, -2.530792236328125, -2.42108154296875, -2.311370849609375, -2.20166015625, -2.091949462890625, -1.98223876953125, -1.872528076171875, -1.7628173828125, -1.653106689453125, -1.54339599609375, -1.433685302734375, -1.323974609375, -1.214263916015625, -1.10455322265625, -0.994842529296875, -0.8851318359375, -0.775421142578125, -0.66571044921875, -0.555999755859375, -0.4462890625, -0.336578369140625, -0.22686767578125, -0.117156982421875, -0.0074462890625, 0.102264404296875, 0.21197509765625, 0.321685791015625, 0.431396484375, 0.541107177734375, 0.65081787109375, 0.760528564453125, 0.8702392578125, 0.979949951171875, 1.08966064453125, 1.199371337890625, 1.30908203125, 1.418792724609375, 1.52850341796875, 1.638214111328125, 1.7479248046875, 1.857635498046875, 1.96734619140625, 2.077056884765625, 2.186767578125, 2.296478271484375, 2.40618896484375, 2.515899658203125, 2.6256103515625, 2.735321044921875, 2.84503173828125, 2.954742431640625, 3.064453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 25.0, 39.0, 99.0, 211.0, 245.0, 210.0, 96.0, 47.0, 16.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.828765869140625, -50.19004821777344, -48.551326751708984, -46.9126091003418, -45.27389144897461, -43.635169982910156, -41.99645233154297, -40.35773468017578, -38.71901321411133, -37.08029556274414, -35.44157409667969, -33.8028564453125, -32.16413879394531, -30.52541732788086, -28.886699676513672, -27.24798011779785, -25.609262466430664, -23.970542907714844, -22.331825256347656, -20.693105697631836, -19.054386138916016, -17.415668487548828, -15.776948928833008, -14.138229370117188, -12.499510765075684, -10.86079216003418, -9.22207260131836, -7.5833539962768555, -5.944634914398193, -4.305915832519531, -2.6671972274780273, -1.028477668762207, 0.6102409362792969, 2.248960018157959, 3.887678861618042, 5.526397705078125, 7.165116786956787, 8.80383586883545, 10.442554473876953, 12.081274032592773, 13.719992637634277, 15.358711242675781, 16.9974308013916, 18.636150360107422, 20.27486801147461, 21.91358757019043, 23.55230712890625, 25.191024780273438, 26.829744338989258, 28.468463897705078, 30.107181549072266, 31.745901107788086, 33.384620666503906, 35.023338317871094, 36.66205596923828, 38.300777435302734, 39.93949508666992, 41.57821273803711, 43.21693420410156, 44.85565185546875, 46.49436950683594, 48.13309097290039, 49.77180862426758, 51.41053009033203, 53.04924774169922]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 3.0, 14.0, 13.0, 12.0, 18.0, 22.0, 13.0, 26.0, 24.0, 25.0, 31.0, 32.0, 26.0, 39.0, 34.0, 48.0, 41.0, 47.0, 45.0, 52.0, 44.0, 40.0, 29.0, 28.0, 29.0, 34.0, 29.0, 31.0, 26.0, 18.0, 16.0, 15.0, 8.0, 12.0, 12.0, 9.0, 11.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.740531921386719, -13.325779914855957, -12.911027908325195, -12.496274948120117, -12.081522941589355, -11.666770935058594, -11.252018928527832, -10.83726692199707, -10.422513961791992, -10.00776195526123, -9.593009948730469, -9.17825698852539, -8.763504981994629, -8.348752975463867, -7.9340009689331055, -7.5192484855651855, -7.104496479034424, -6.689744472503662, -6.274991989135742, -5.8602399826049805, -5.4454874992370605, -5.030735492706299, -4.615983009338379, -4.201231002807617, -3.7864787578582764, -3.3717265129089355, -2.9569742679595947, -2.542222023010254, -2.127470016479492, -1.7127177715301514, -1.2979655265808105, -0.8832132816314697, -0.4684610366821289, -0.053708821535110474, 0.36104339361190796, 0.775795578956604, 1.1905478239059448, 1.605299949645996, 2.020052194595337, 2.4348044395446777, 2.8495566844940186, 3.2643089294433594, 3.6790611743927, 4.093813419342041, 4.508565425872803, 4.923317909240723, 5.338069915771484, 5.752821922302246, 6.167574405670166, 6.582326412200928, 6.997078895568848, 7.411830902099609, 7.826583385467529, 8.241334915161133, 8.656087875366211, 9.070839881896973, 9.485591888427734, 9.900343894958496, 10.315095901489258, 10.729848861694336, 11.144600868225098, 11.55935287475586, 11.974104881286621, 12.388856887817383, 12.803609848022461]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 15.0, 21.0, 36.0, 28.0, 53.0, 73.0, 139.0, 208.0, 390.0, 699.0, 1394.0, 2951.0, 6360.0, 15084.0, 39744.0, 132520.0, 1526892.0, 2257525.0, 141414.0, 41205.0, 15512.0, 6314.0, 2880.0, 1379.0, 632.0, 350.0, 194.0, 106.0, 65.0, 28.0, 29.0, 11.0, 6.0, 9.0, 3.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1796875, -4.07257080078125, -3.9654541015625, -3.85833740234375, -3.751220703125, -3.64410400390625, -3.5369873046875, -3.42987060546875, -3.32275390625, -3.21563720703125, -3.1085205078125, -3.00140380859375, -2.894287109375, -2.78717041015625, -2.6800537109375, -2.57293701171875, -2.4658203125, -2.35870361328125, -2.2515869140625, -2.14447021484375, -2.037353515625, -1.93023681640625, -1.8231201171875, -1.71600341796875, -1.60888671875, -1.50177001953125, -1.3946533203125, -1.28753662109375, -1.180419921875, -1.07330322265625, -0.9661865234375, -0.85906982421875, -0.751953125, -0.64483642578125, -0.5377197265625, -0.43060302734375, -0.323486328125, -0.21636962890625, -0.1092529296875, -0.00213623046875, 0.10498046875, 0.21209716796875, 0.3192138671875, 0.42633056640625, 0.533447265625, 0.64056396484375, 0.7476806640625, 0.85479736328125, 0.9619140625, 1.06903076171875, 1.1761474609375, 1.28326416015625, 1.390380859375, 1.49749755859375, 1.6046142578125, 1.71173095703125, 1.81884765625, 1.92596435546875, 2.0330810546875, 2.14019775390625, 2.247314453125, 2.35443115234375, 2.4615478515625, 2.56866455078125, 2.67578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 12.0, 14.0, 11.0, 24.0, 22.0, 29.0, 44.0, 55.0, 44.0, 50.0, 51.0, 67.0, 62.0, 55.0, 66.0, 64.0, 47.0, 50.0, 54.0, 39.0, 27.0, 24.0, 19.0, 17.0, 11.0, 7.0, 6.0, 10.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.81640625, -0.7948760986328125, -0.773345947265625, -0.7518157958984375, -0.73028564453125, -0.7087554931640625, -0.687225341796875, -0.6656951904296875, -0.6441650390625, -0.6226348876953125, -0.601104736328125, -0.5795745849609375, -0.55804443359375, -0.5365142822265625, -0.514984130859375, -0.4934539794921875, -0.471923828125, -0.4503936767578125, -0.428863525390625, -0.4073333740234375, -0.38580322265625, -0.3642730712890625, -0.342742919921875, -0.3212127685546875, -0.2996826171875, -0.2781524658203125, -0.256622314453125, -0.2350921630859375, -0.21356201171875, -0.1920318603515625, -0.170501708984375, -0.1489715576171875, -0.12744140625, -0.1059112548828125, -0.084381103515625, -0.0628509521484375, -0.04132080078125, -0.0197906494140625, 0.001739501953125, 0.0232696533203125, 0.0447998046875, 0.0663299560546875, 0.087860107421875, 0.1093902587890625, 0.13092041015625, 0.1524505615234375, 0.173980712890625, 0.1955108642578125, 0.217041015625, 0.2385711669921875, 0.260101318359375, 0.2816314697265625, 0.30316162109375, 0.3246917724609375, 0.346221923828125, 0.3677520751953125, 0.3892822265625, 0.4108123779296875, 0.432342529296875, 0.4538726806640625, 0.47540283203125, 0.4969329833984375, 0.518463134765625, 0.5399932861328125, 0.5615234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 14.0, 41.0, 109.0, 257.0, 726.0, 2220.0, 7771.0, 37024.0, 286738.0, 3515136.0, 295108.0, 38062.0, 7916.0, 2073.0, 660.0, 257.0, 88.0, 34.0, 15.0, 13.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.4375, -7.26251220703125, -7.0875244140625, -6.91253662109375, -6.737548828125, -6.56256103515625, -6.3875732421875, -6.21258544921875, -6.03759765625, -5.86260986328125, -5.6876220703125, -5.51263427734375, -5.337646484375, -5.16265869140625, -4.9876708984375, -4.81268310546875, -4.6376953125, -4.46270751953125, -4.2877197265625, -4.11273193359375, -3.937744140625, -3.76275634765625, -3.5877685546875, -3.41278076171875, -3.23779296875, -3.06280517578125, -2.8878173828125, -2.71282958984375, -2.537841796875, -2.36285400390625, -2.1878662109375, -2.01287841796875, -1.837890625, -1.66290283203125, -1.4879150390625, -1.31292724609375, -1.137939453125, -0.96295166015625, -0.7879638671875, -0.61297607421875, -0.43798828125, -0.26300048828125, -0.0880126953125, 0.08697509765625, 0.261962890625, 0.43695068359375, 0.6119384765625, 0.78692626953125, 0.9619140625, 1.13690185546875, 1.3118896484375, 1.48687744140625, 1.661865234375, 1.83685302734375, 2.0118408203125, 2.18682861328125, 2.36181640625, 2.53680419921875, 2.7117919921875, 2.88677978515625, 3.061767578125, 3.23675537109375, 3.4117431640625, 3.58673095703125, 3.76171875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 11.0, 12.0, 6.0, 15.0, 30.0, 14.0, 32.0, 48.0, 43.0, 81.0, 111.0, 145.0, 242.0, 531.0, 1170.0, 574.0, 301.0, 178.0, 136.0, 88.0, 66.0, 54.0, 33.0, 33.0, 14.0, 18.0, 16.0, 15.0, 12.0, 12.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.18359375, -1.1461639404296875, -1.108734130859375, -1.0713043212890625, -1.03387451171875, -0.9964447021484375, -0.959014892578125, -0.9215850830078125, -0.8841552734375, -0.8467254638671875, -0.809295654296875, -0.7718658447265625, -0.73443603515625, -0.6970062255859375, -0.659576416015625, -0.6221466064453125, -0.584716796875, -0.5472869873046875, -0.509857177734375, -0.4724273681640625, -0.43499755859375, -0.3975677490234375, -0.360137939453125, -0.3227081298828125, -0.2852783203125, -0.2478485107421875, -0.210418701171875, -0.1729888916015625, -0.13555908203125, -0.0981292724609375, -0.060699462890625, -0.0232696533203125, 0.01416015625, 0.0515899658203125, 0.089019775390625, 0.1264495849609375, 0.16387939453125, 0.2013092041015625, 0.238739013671875, 0.2761688232421875, 0.3135986328125, 0.3510284423828125, 0.388458251953125, 0.4258880615234375, 0.46331787109375, 0.5007476806640625, 0.538177490234375, 0.5756072998046875, 0.613037109375, 0.6504669189453125, 0.687896728515625, 0.7253265380859375, 0.76275634765625, 0.8001861572265625, 0.837615966796875, 0.8750457763671875, 0.9124755859375, 0.9499053955078125, 0.987335205078125, 1.0247650146484375, 1.06219482421875, 1.0996246337890625, 1.137054443359375, 1.1744842529296875, 1.2119140625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 16.0, 13.0, 25.0, 49.0, 71.0, 75.0, 94.0, 106.0, 100.0, 98.0, 92.0, 78.0, 46.0, 53.0, 23.0, 13.0, 10.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.627416610717773, -6.313331604003906, -5.999247074127197, -5.685162544250488, -5.371077537536621, -5.056992530822754, -4.742908000946045, -4.428823471069336, -4.114738464355469, -3.8006536960601807, -3.4865689277648926, -3.1724841594696045, -2.8583993911743164, -2.5443146228790283, -2.2302298545837402, -1.9161450862884521, -1.602060317993164, -1.287975549697876, -0.9738907814025879, -0.6598060131072998, -0.3457212448120117, -0.03163647651672363, 0.28244829177856445, 0.5965330600738525, 0.9106178283691406, 1.2247025966644287, 1.5387873649597168, 1.8528721332550049, 2.166956901550293, 2.481041669845581, 2.795126438140869, 3.1092112064361572, 3.4232969284057617, 3.73738169670105, 4.051466464996338, 4.365550994873047, 4.679636001586914, 4.993721008300781, 5.30780553817749, 5.621890068054199, 5.935975074768066, 6.250060081481934, 6.564144611358643, 6.878229141235352, 7.192314147949219, 7.506399154663086, 7.820483684539795, 8.134568214416504, 8.448653221130371, 8.762738227844238, 9.076822280883789, 9.390907287597656, 9.704992294311523, 10.01907730102539, 10.333162307739258, 10.647246360778809, 10.961331367492676, 11.275416374206543, 11.589500427246094, 11.903585433959961, 12.217670440673828, 12.531755447387695, 12.845840454101562, 13.159924507141113, 13.47400951385498]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 9.0, 10.0, 11.0, 9.0, 18.0, 15.0, 22.0, 38.0, 37.0, 42.0, 47.0, 45.0, 46.0, 42.0, 41.0, 46.0, 39.0, 62.0, 54.0, 48.0, 46.0, 43.0, 38.0, 41.0, 25.0, 30.0, 24.0, 22.0, 10.0, 12.0, 5.0, 4.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.186864852905273, -5.988927841186523, -5.790990829467773, -5.593053817749023, -5.395116806030273, -5.197179794311523, -4.999242782592773, -4.801306247711182, -4.603369235992432, -4.405432224273682, -4.207495212554932, -4.009558200836182, -3.8116214275360107, -3.6136844158172607, -3.4157474040985107, -3.21781063079834, -3.0198733806610107, -2.8219363689422607, -2.6239993572235107, -2.42606258392334, -2.22812557220459, -2.03018856048584, -1.8322515487670898, -1.6343146562576294, -1.4363776445388794, -1.2384406328201294, -1.040503740310669, -0.842566728591919, -0.6446297764778137, -0.4466928243637085, -0.2487558126449585, -0.05081892013549805, 0.14711809158325195, 0.3450550436973572, 0.5429919958114624, 0.7409290075302124, 0.9388659596443176, 1.1368029117584229, 1.3347399234771729, 1.5326768159866333, 1.7306138277053833, 1.9285508394241333, 2.1264877319335938, 2.3244247436523438, 2.5223617553710938, 2.7202987670898438, 2.9182357788085938, 3.1161725521087646, 3.3141095638275146, 3.5120465755462646, 3.7099835872650146, 3.9079203605651855, 4.1058573722839355, 4.3037943840026855, 4.5017313957214355, 4.6996684074401855, 4.8976054191589355, 5.0955424308776855, 5.2934794425964355, 5.4914164543151855, 5.6893534660339355, 5.887290000915527, 6.085227012634277, 6.283164024353027, 6.481101036071777]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 3.0, 6.0, 16.0, 12.0, 17.0, 30.0, 46.0, 84.0, 126.0, 214.0, 376.0, 633.0, 1155.0, 2256.0, 4423.0, 8894.0, 18709.0, 39128.0, 83019.0, 182636.0, 347411.0, 192965.0, 86591.0, 41413.0, 19468.0, 9225.0, 4591.0, 2310.0, 1199.0, 673.0, 331.0, 226.0, 133.0, 74.0, 47.0, 31.0, 26.0, 24.0, 6.0, 3.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.650390625, -2.560638427734375, -2.47088623046875, -2.381134033203125, -2.2913818359375, -2.201629638671875, -2.11187744140625, -2.022125244140625, -1.932373046875, -1.842620849609375, -1.75286865234375, -1.663116455078125, -1.5733642578125, -1.483612060546875, -1.39385986328125, -1.304107666015625, -1.21435546875, -1.124603271484375, -1.03485107421875, -0.945098876953125, -0.8553466796875, -0.765594482421875, -0.67584228515625, -0.586090087890625, -0.496337890625, -0.406585693359375, -0.31683349609375, -0.227081298828125, -0.1373291015625, -0.047576904296875, 0.04217529296875, 0.131927490234375, 0.2216796875, 0.311431884765625, 0.40118408203125, 0.490936279296875, 0.5806884765625, 0.670440673828125, 0.76019287109375, 0.849945068359375, 0.939697265625, 1.029449462890625, 1.11920166015625, 1.208953857421875, 1.2987060546875, 1.388458251953125, 1.47821044921875, 1.567962646484375, 1.65771484375, 1.747467041015625, 1.83721923828125, 1.926971435546875, 2.0167236328125, 2.106475830078125, 2.19622802734375, 2.285980224609375, 2.375732421875, 2.465484619140625, 2.55523681640625, 2.644989013671875, 2.7347412109375, 2.824493408203125, 2.91424560546875, 3.003997802734375, 3.09375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 11.0, 3.0, 14.0, 16.0, 20.0, 27.0, 26.0, 37.0, 42.0, 52.0, 46.0, 56.0, 64.0, 57.0, 51.0, 62.0, 65.0, 56.0, 48.0, 44.0, 37.0, 37.0, 29.0, 26.0, 12.0, 15.0, 14.0, 8.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8359375, -0.81463623046875, -0.7933349609375, -0.77203369140625, -0.750732421875, -0.72943115234375, -0.7081298828125, -0.68682861328125, -0.66552734375, -0.64422607421875, -0.6229248046875, -0.60162353515625, -0.580322265625, -0.55902099609375, -0.5377197265625, -0.51641845703125, -0.4951171875, -0.47381591796875, -0.4525146484375, -0.43121337890625, -0.409912109375, -0.38861083984375, -0.3673095703125, -0.34600830078125, -0.32470703125, -0.30340576171875, -0.2821044921875, -0.26080322265625, -0.239501953125, -0.21820068359375, -0.1968994140625, -0.17559814453125, -0.154296875, -0.13299560546875, -0.1116943359375, -0.09039306640625, -0.069091796875, -0.04779052734375, -0.0264892578125, -0.00518798828125, 0.01611328125, 0.03741455078125, 0.0587158203125, 0.08001708984375, 0.101318359375, 0.12261962890625, 0.1439208984375, 0.16522216796875, 0.1865234375, 0.20782470703125, 0.2291259765625, 0.25042724609375, 0.271728515625, 0.29302978515625, 0.3143310546875, 0.33563232421875, 0.35693359375, 0.37823486328125, 0.3995361328125, 0.42083740234375, 0.442138671875, 0.46343994140625, 0.4847412109375, 0.50604248046875, 0.52734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 11.0, 9.0, 20.0, 34.0, 49.0, 81.0, 161.0, 291.0, 680.0, 1540.0, 4102.0, 13044.0, 49512.0, 197141.0, 516694.0, 195556.0, 49205.0, 13377.0, 4176.0, 1534.0, 641.0, 314.0, 136.0, 91.0, 55.0, 31.0, 24.0, 9.0, 9.0, 6.0, 7.0, 0.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.373046875, -3.240753173828125, -3.10845947265625, -2.976165771484375, -2.8438720703125, -2.711578369140625, -2.57928466796875, -2.446990966796875, -2.314697265625, -2.182403564453125, -2.05010986328125, -1.917816162109375, -1.7855224609375, -1.653228759765625, -1.52093505859375, -1.388641357421875, -1.25634765625, -1.124053955078125, -0.99176025390625, -0.859466552734375, -0.7271728515625, -0.594879150390625, -0.46258544921875, -0.330291748046875, -0.197998046875, -0.065704345703125, 0.06658935546875, 0.198883056640625, 0.3311767578125, 0.463470458984375, 0.59576416015625, 0.728057861328125, 0.8603515625, 0.992645263671875, 1.12493896484375, 1.257232666015625, 1.3895263671875, 1.521820068359375, 1.65411376953125, 1.786407470703125, 1.918701171875, 2.050994873046875, 2.18328857421875, 2.315582275390625, 2.4478759765625, 2.580169677734375, 2.71246337890625, 2.844757080078125, 2.97705078125, 3.109344482421875, 3.24163818359375, 3.373931884765625, 3.5062255859375, 3.638519287109375, 3.77081298828125, 3.903106689453125, 4.035400390625, 4.167694091796875, 4.29998779296875, 4.432281494140625, 4.5645751953125, 4.696868896484375, 4.82916259765625, 4.961456298828125, 5.09375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 4.0, 18.0, 13.0, 21.0, 19.0, 30.0, 23.0, 30.0, 25.0, 42.0, 32.0, 54.0, 44.0, 43.0, 41.0, 38.0, 42.0, 36.0, 47.0, 29.0, 44.0, 31.0, 46.0, 38.0, 29.0, 34.0, 25.0, 32.0, 22.0, 13.0, 9.0, 8.0, 7.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.821075439453125, -2.73394775390625, -2.646820068359375, -2.5596923828125, -2.472564697265625, -2.38543701171875, -2.298309326171875, -2.211181640625, -2.124053955078125, -2.03692626953125, -1.949798583984375, -1.8626708984375, -1.775543212890625, -1.68841552734375, -1.601287841796875, -1.51416015625, -1.427032470703125, -1.33990478515625, -1.252777099609375, -1.1656494140625, -1.078521728515625, -0.99139404296875, -0.904266357421875, -0.817138671875, -0.730010986328125, -0.64288330078125, -0.555755615234375, -0.4686279296875, -0.381500244140625, -0.29437255859375, -0.207244873046875, -0.1201171875, -0.032989501953125, 0.05413818359375, 0.141265869140625, 0.2283935546875, 0.315521240234375, 0.40264892578125, 0.489776611328125, 0.576904296875, 0.664031982421875, 0.75115966796875, 0.838287353515625, 0.9254150390625, 1.012542724609375, 1.09967041015625, 1.186798095703125, 1.27392578125, 1.361053466796875, 1.44818115234375, 1.535308837890625, 1.6224365234375, 1.709564208984375, 1.79669189453125, 1.883819580078125, 1.970947265625, 2.058074951171875, 2.14520263671875, 2.232330322265625, 2.3194580078125, 2.406585693359375, 2.49371337890625, 2.580841064453125, 2.66796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 16.0, 21.0, 21.0, 40.0, 41.0, 84.0, 120.0, 186.0, 331.0, 518.0, 1041.0, 1963.0, 4481.0, 14297.0, 92331.0, 755140.0, 148470.0, 19193.0, 5425.0, 2286.0, 1118.0, 565.0, 323.0, 188.0, 114.0, 62.0, 56.0, 34.0, 19.0, 18.0, 15.0, 5.0, 5.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.776275634765625, -3.62872314453125, -3.481170654296875, -3.3336181640625, -3.186065673828125, -3.03851318359375, -2.890960693359375, -2.743408203125, -2.595855712890625, -2.44830322265625, -2.300750732421875, -2.1531982421875, -2.005645751953125, -1.85809326171875, -1.710540771484375, -1.56298828125, -1.415435791015625, -1.26788330078125, -1.120330810546875, -0.9727783203125, -0.825225830078125, -0.67767333984375, -0.530120849609375, -0.382568359375, -0.235015869140625, -0.08746337890625, 0.060089111328125, 0.2076416015625, 0.355194091796875, 0.50274658203125, 0.650299072265625, 0.7978515625, 0.945404052734375, 1.09295654296875, 1.240509033203125, 1.3880615234375, 1.535614013671875, 1.68316650390625, 1.830718994140625, 1.978271484375, 2.125823974609375, 2.27337646484375, 2.420928955078125, 2.5684814453125, 2.716033935546875, 2.86358642578125, 3.011138916015625, 3.15869140625, 3.306243896484375, 3.45379638671875, 3.601348876953125, 3.7489013671875, 3.896453857421875, 4.04400634765625, 4.191558837890625, 4.339111328125, 4.486663818359375, 4.63421630859375, 4.781768798828125, 4.9293212890625, 5.076873779296875, 5.22442626953125, 5.371978759765625, 5.51953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 7.0, 3.0, 5.0, 13.0, 11.0, 26.0, 42.0, 71.0, 129.0, 301.0, 196.0, 77.0, 48.0, 25.0, 18.0, 17.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009870529174804688, -0.0009559690952301025, -0.0009248852729797363, -0.0008938014507293701, -0.0008627176284790039, -0.0008316338062286377, -0.0008005499839782715, -0.0007694661617279053, -0.0007383823394775391, -0.0007072985172271729, -0.0006762146949768066, -0.0006451308727264404, -0.0006140470504760742, -0.000582963228225708, -0.0005518794059753418, -0.0005207955837249756, -0.0004897117614746094, -0.00045862793922424316, -0.00042754411697387695, -0.00039646029472351074, -0.00036537647247314453, -0.0003342926502227783, -0.0003032088279724121, -0.0002721250057220459, -0.0002410411834716797, -0.00020995736122131348, -0.00017887353897094727, -0.00014778971672058105, -0.00011670589447021484, -8.562207221984863e-05, -5.453824996948242e-05, -2.345442771911621e-05, 7.62939453125e-06, 3.871321678161621e-05, 6.979703903198242e-05, 0.00010088086128234863, 0.00013196468353271484, 0.00016304850578308105, 0.00019413232803344727, 0.00022521615028381348, 0.0002562999725341797, 0.0002873837947845459, 0.0003184676170349121, 0.0003495514392852783, 0.00038063526153564453, 0.00041171908378601074, 0.00044280290603637695, 0.00047388672828674316, 0.0005049705505371094, 0.0005360543727874756, 0.0005671381950378418, 0.000598222017288208, 0.0006293058395385742, 0.0006603896617889404, 0.0006914734840393066, 0.0007225573062896729, 0.0007536411285400391, 0.0007847249507904053, 0.0008158087730407715, 0.0008468925952911377, 0.0008779764175415039, 0.0009090602397918701, 0.0009401440620422363, 0.0009712278842926025, 0.0010023117065429688]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 9.0, 3.0, 22.0, 18.0, 33.0, 75.0, 108.0, 224.0, 370.0, 848.0, 1921.0, 4592.0, 14118.0, 95821.0, 788083.0, 117515.0, 16027.0, 4929.0, 1950.0, 882.0, 479.0, 235.0, 113.0, 61.0, 40.0, 22.0, 11.0, 14.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.36505126953125, -5.1949462890625, -5.02484130859375, -4.854736328125, -4.68463134765625, -4.5145263671875, -4.34442138671875, -4.17431640625, -4.00421142578125, -3.8341064453125, -3.66400146484375, -3.493896484375, -3.32379150390625, -3.1536865234375, -2.98358154296875, -2.8134765625, -2.64337158203125, -2.4732666015625, -2.30316162109375, -2.133056640625, -1.96295166015625, -1.7928466796875, -1.62274169921875, -1.45263671875, -1.28253173828125, -1.1124267578125, -0.94232177734375, -0.772216796875, -0.60211181640625, -0.4320068359375, -0.26190185546875, -0.091796875, 0.07830810546875, 0.2484130859375, 0.41851806640625, 0.588623046875, 0.75872802734375, 0.9288330078125, 1.09893798828125, 1.26904296875, 1.43914794921875, 1.6092529296875, 1.77935791015625, 1.949462890625, 2.11956787109375, 2.2896728515625, 2.45977783203125, 2.6298828125, 2.79998779296875, 2.9700927734375, 3.14019775390625, 3.310302734375, 3.48040771484375, 3.6505126953125, 3.82061767578125, 3.99072265625, 4.16082763671875, 4.3309326171875, 4.50103759765625, 4.671142578125, 4.84124755859375, 5.0113525390625, 5.18145751953125, 5.3515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 9.0, 7.0, 15.0, 13.0, 11.0, 27.0, 27.0, 50.0, 61.0, 100.0, 120.0, 132.0, 111.0, 77.0, 57.0, 42.0, 31.0, 21.0, 24.0, 12.0, 7.0, 5.0, 7.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-2.45703125, -2.383209228515625, -2.30938720703125, -2.235565185546875, -2.1617431640625, -2.087921142578125, -2.01409912109375, -1.940277099609375, -1.866455078125, -1.792633056640625, -1.71881103515625, -1.644989013671875, -1.5711669921875, -1.497344970703125, -1.42352294921875, -1.349700927734375, -1.27587890625, -1.202056884765625, -1.12823486328125, -1.054412841796875, -0.9805908203125, -0.906768798828125, -0.83294677734375, -0.759124755859375, -0.685302734375, -0.611480712890625, -0.53765869140625, -0.463836669921875, -0.3900146484375, -0.316192626953125, -0.24237060546875, -0.168548583984375, -0.0947265625, -0.020904541015625, 0.05291748046875, 0.126739501953125, 0.2005615234375, 0.274383544921875, 0.34820556640625, 0.422027587890625, 0.495849609375, 0.569671630859375, 0.64349365234375, 0.717315673828125, 0.7911376953125, 0.864959716796875, 0.93878173828125, 1.012603759765625, 1.08642578125, 1.160247802734375, 1.23406982421875, 1.307891845703125, 1.3817138671875, 1.455535888671875, 1.52935791015625, 1.603179931640625, 1.677001953125, 1.750823974609375, 1.82464599609375, 1.898468017578125, 1.9722900390625, 2.046112060546875, 2.11993408203125, 2.193756103515625, 2.267578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 10.0, 17.0, 34.0, 51.0, 66.0, 125.0, 171.0, 167.0, 140.0, 105.0, 47.0, 35.0, 20.0, 9.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.747520446777344, -41.50143814086914, -40.25535583496094, -39.009273529052734, -37.76319122314453, -36.51710510253906, -35.27102279663086, -34.024940490722656, -32.77885818481445, -31.53277587890625, -30.286693572998047, -29.04060935974121, -27.794527053833008, -26.548444747924805, -25.30236053466797, -24.056278228759766, -22.810195922851562, -21.56411361694336, -20.318031311035156, -19.07194709777832, -17.825864791870117, -16.579782485961914, -15.333699226379395, -14.087615966796875, -12.841533660888672, -11.595451354980469, -10.34936809539795, -9.10328483581543, -7.857202529907227, -6.611119747161865, -5.365036964416504, -4.118953704833984, -2.8728675842285156, -1.6267848014831543, -0.38070201873779297, 0.8653807640075684, 2.1114635467529297, 3.357546329498291, 4.603629112243652, 5.849712371826172, 7.095794677734375, 8.341876983642578, 9.587960243225098, 10.834043502807617, 12.08012580871582, 13.326208114624023, 14.572291374206543, 15.818374633789062, 17.064456939697266, 18.31053924560547, 19.556621551513672, 20.802705764770508, 22.04878807067871, 23.294870376586914, 24.54095458984375, 25.787036895751953, 27.033119201660156, 28.27920150756836, 29.525283813476562, 30.7713680267334, 32.01744842529297, 33.26353454589844, 34.50961685180664, 35.755699157714844, 37.00178146362305]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 5.0, 5.0, 15.0, 13.0, 15.0, 25.0, 30.0, 29.0, 22.0, 42.0, 55.0, 48.0, 45.0, 52.0, 54.0, 52.0, 58.0, 54.0, 48.0, 41.0, 62.0, 45.0, 45.0, 27.0, 27.0, 17.0, 18.0, 8.0, 11.0, 3.0, 4.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.627655029296875, -22.995698928833008, -22.36374282836914, -21.731786727905273, -21.099830627441406, -20.467872619628906, -19.835918426513672, -19.203960418701172, -18.572004318237305, -17.940048217773438, -17.30809211730957, -16.676136016845703, -16.044179916381836, -15.412222862243652, -14.780266761779785, -14.148309707641602, -13.51635456085205, -12.884398460388184, -12.252442359924316, -11.620485305786133, -10.988529205322266, -10.356573104858398, -9.724617004394531, -9.092660903930664, -8.460704803466797, -7.82874870300293, -7.196792125701904, -6.564836025238037, -5.932879447937012, -5.3009233474731445, -4.668967247009277, -4.037010669708252, -3.4050540924072266, -2.7730977535247803, -2.141141414642334, -1.5091853141784668, -0.8772289752960205, -0.24527263641357422, 0.38668346405029297, 1.0186400413513184, 1.6505961418151855, 2.282552480697632, 2.914508819580078, 3.5464649200439453, 4.1784210205078125, 4.810377597808838, 5.442333698272705, 6.0742902755737305, 6.706246376037598, 7.338202476501465, 7.97015905380249, 8.602115631103516, 9.234071731567383, 9.86602783203125, 10.497983932495117, 11.129940032958984, 11.761896133422852, 12.393852233886719, 13.025808334350586, 13.657764434814453, 14.289721488952637, 14.921677589416504, 15.553633689880371, 16.185590744018555, 16.817546844482422]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 8.0, 13.0, 20.0, 20.0, 31.0, 50.0, 64.0, 107.0, 187.0, 243.0, 470.0, 738.0, 1260.0, 2458.0, 5032.0, 12117.0, 34850.0, 140039.0, 3387767.0, 500314.0, 71279.0, 21385.0, 8113.0, 3507.0, 1798.0, 972.0, 526.0, 318.0, 235.0, 124.0, 74.0, 61.0, 32.0, 15.0, 21.0, 7.0, 11.0, 4.0, 1.0, 1.0, 4.0, 3.0], "bins": [-5.08984375, -4.96502685546875, -4.8402099609375, -4.71539306640625, -4.590576171875, -4.46575927734375, -4.3409423828125, -4.21612548828125, -4.09130859375, -3.96649169921875, -3.8416748046875, -3.71685791015625, -3.592041015625, -3.46722412109375, -3.3424072265625, -3.21759033203125, -3.0927734375, -2.96795654296875, -2.8431396484375, -2.71832275390625, -2.593505859375, -2.46868896484375, -2.3438720703125, -2.21905517578125, -2.09423828125, -1.96942138671875, -1.8446044921875, -1.71978759765625, -1.594970703125, -1.47015380859375, -1.3453369140625, -1.22052001953125, -1.095703125, -0.97088623046875, -0.8460693359375, -0.72125244140625, -0.596435546875, -0.47161865234375, -0.3468017578125, -0.22198486328125, -0.09716796875, 0.02764892578125, 0.1524658203125, 0.27728271484375, 0.402099609375, 0.52691650390625, 0.6517333984375, 0.77655029296875, 0.9013671875, 1.02618408203125, 1.1510009765625, 1.27581787109375, 1.400634765625, 1.52545166015625, 1.6502685546875, 1.77508544921875, 1.89990234375, 2.02471923828125, 2.1495361328125, 2.27435302734375, 2.399169921875, 2.52398681640625, 2.6488037109375, 2.77362060546875, 2.8984375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 3.0, 13.0, 26.0, 21.0, 23.0, 30.0, 35.0, 49.0, 58.0, 62.0, 70.0, 72.0, 68.0, 58.0, 68.0, 58.0, 57.0, 64.0, 32.0, 34.0, 30.0, 21.0, 12.0, 8.0, 10.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.103515625, -1.0761642456054688, -1.0488128662109375, -1.0214614868164062, -0.994110107421875, -0.9667587280273438, -0.9394073486328125, -0.9120559692382812, -0.88470458984375, -0.8573532104492188, -0.8300018310546875, -0.8026504516601562, -0.775299072265625, -0.7479476928710938, -0.7205963134765625, -0.6932449340820312, -0.6658935546875, -0.6385421752929688, -0.6111907958984375, -0.5838394165039062, -0.556488037109375, -0.5291366577148438, -0.5017852783203125, -0.47443389892578125, -0.44708251953125, -0.41973114013671875, -0.3923797607421875, -0.36502838134765625, -0.337677001953125, -0.31032562255859375, -0.2829742431640625, -0.25562286376953125, -0.228271484375, -0.20092010498046875, -0.1735687255859375, -0.14621734619140625, -0.118865966796875, -0.09151458740234375, -0.0641632080078125, -0.03681182861328125, -0.00946044921875, 0.01789093017578125, 0.0452423095703125, 0.07259368896484375, 0.099945068359375, 0.12729644775390625, 0.1546478271484375, 0.18199920654296875, 0.2093505859375, 0.23670196533203125, 0.2640533447265625, 0.29140472412109375, 0.318756103515625, 0.34610748291015625, 0.3734588623046875, 0.40081024169921875, 0.42816162109375, 0.45551300048828125, 0.4828643798828125, 0.5102157592773438, 0.537567138671875, 0.5649185180664062, 0.5922698974609375, 0.6196212768554688, 0.64697265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 13.0, 20.0, 24.0, 39.0, 37.0, 68.0, 101.0, 177.0, 287.0, 443.0, 849.0, 1628.0, 3501.0, 8436.0, 23976.0, 83351.0, 485935.0, 3245773.0, 254757.0, 55643.0, 17210.0, 6245.0, 2624.0, 1325.0, 717.0, 418.0, 212.0, 148.0, 89.0, 75.0, 37.0, 37.0, 35.0, 17.0, 11.0, 2.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0234375, -3.89508056640625, -3.7667236328125, -3.63836669921875, -3.510009765625, -3.38165283203125, -3.2532958984375, -3.12493896484375, -2.99658203125, -2.86822509765625, -2.7398681640625, -2.61151123046875, -2.483154296875, -2.35479736328125, -2.2264404296875, -2.09808349609375, -1.9697265625, -1.84136962890625, -1.7130126953125, -1.58465576171875, -1.456298828125, -1.32794189453125, -1.1995849609375, -1.07122802734375, -0.94287109375, -0.81451416015625, -0.6861572265625, -0.55780029296875, -0.429443359375, -0.30108642578125, -0.1727294921875, -0.04437255859375, 0.083984375, 0.21234130859375, 0.3406982421875, 0.46905517578125, 0.597412109375, 0.72576904296875, 0.8541259765625, 0.98248291015625, 1.11083984375, 1.23919677734375, 1.3675537109375, 1.49591064453125, 1.624267578125, 1.75262451171875, 1.8809814453125, 2.00933837890625, 2.1376953125, 2.26605224609375, 2.3944091796875, 2.52276611328125, 2.651123046875, 2.77947998046875, 2.9078369140625, 3.03619384765625, 3.16455078125, 3.29290771484375, 3.4212646484375, 3.54962158203125, 3.677978515625, 3.80633544921875, 3.9346923828125, 4.06304931640625, 4.19140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 3.0, 16.0, 20.0, 33.0, 29.0, 55.0, 112.0, 172.0, 389.0, 1692.0, 807.0, 314.0, 153.0, 99.0, 54.0, 30.0, 28.0, 13.0, 12.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.509765625, -1.451263427734375, -1.39276123046875, -1.334259033203125, -1.2757568359375, -1.217254638671875, -1.15875244140625, -1.100250244140625, -1.041748046875, -0.983245849609375, -0.92474365234375, -0.866241455078125, -0.8077392578125, -0.749237060546875, -0.69073486328125, -0.632232666015625, -0.57373046875, -0.515228271484375, -0.45672607421875, -0.398223876953125, -0.3397216796875, -0.281219482421875, -0.22271728515625, -0.164215087890625, -0.105712890625, -0.047210693359375, 0.01129150390625, 0.069793701171875, 0.1282958984375, 0.186798095703125, 0.24530029296875, 0.303802490234375, 0.3623046875, 0.420806884765625, 0.47930908203125, 0.537811279296875, 0.5963134765625, 0.654815673828125, 0.71331787109375, 0.771820068359375, 0.830322265625, 0.888824462890625, 0.94732666015625, 1.005828857421875, 1.0643310546875, 1.122833251953125, 1.18133544921875, 1.239837646484375, 1.29833984375, 1.356842041015625, 1.41534423828125, 1.473846435546875, 1.5323486328125, 1.590850830078125, 1.64935302734375, 1.707855224609375, 1.766357421875, 1.824859619140625, 1.88336181640625, 1.941864013671875, 2.0003662109375, 2.058868408203125, 2.11737060546875, 2.175872802734375, 2.234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 1.0, 7.0, 25.0, 31.0, 47.0, 67.0, 104.0, 120.0, 147.0, 110.0, 120.0, 79.0, 52.0, 28.0, 24.0, 23.0, 8.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.568680763244629, -13.186437606811523, -12.804195404052734, -12.421953201293945, -12.03971004486084, -11.657466888427734, -11.275224685668945, -10.892982482910156, -10.51073932647705, -10.128496170043945, -9.746253967285156, -9.364011764526367, -8.981768608093262, -8.599525451660156, -8.217283248901367, -7.83504056930542, -7.452797889709473, -7.070555210113525, -6.688312530517578, -6.306069850921631, -5.923827171325684, -5.541584491729736, -5.159341812133789, -4.777099132537842, -4.3948564529418945, -4.012613773345947, -3.63037109375, -3.2481284141540527, -2.8658857345581055, -2.483643054962158, -2.101400375366211, -1.7191576957702637, -1.3369140625, -0.9546713829040527, -0.5724287033081055, -0.1901860237121582, 0.19205665588378906, 0.5742993354797363, 0.9565420150756836, 1.3387846946716309, 1.7210273742675781, 2.1032700538635254, 2.4855127334594727, 2.86775541305542, 3.249998092651367, 3.6322407722473145, 4.014483451843262, 4.396726131439209, 4.778968811035156, 5.1612114906311035, 5.543454170227051, 5.925696849822998, 6.307939529418945, 6.690182209014893, 7.07242488861084, 7.454667568206787, 7.836910247802734, 8.219152450561523, 8.601395606994629, 8.983638763427734, 9.365880966186523, 9.748123168945312, 10.130366325378418, 10.512609481811523, 10.894851684570312]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 2.0, 12.0, 11.0, 16.0, 11.0, 20.0, 24.0, 20.0, 31.0, 35.0, 34.0, 42.0, 42.0, 45.0, 42.0, 51.0, 47.0, 38.0, 50.0, 49.0, 39.0, 50.0, 38.0, 44.0, 31.0, 31.0, 29.0, 30.0, 19.0, 20.0, 13.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.347925186157227, -5.161818504333496, -4.975711345672607, -4.789604663848877, -4.6034979820251465, -4.417390823364258, -4.231284141540527, -4.045177459716797, -3.859070301055908, -3.6729633808135986, -3.486856698989868, -3.3007497787475586, -3.114642858505249, -2.9285359382629395, -2.742429256439209, -2.5563223361968994, -2.370215654373169, -2.1841087341308594, -1.9980019330978394, -1.8118951320648193, -1.6257882118225098, -1.4396814107894897, -1.2535746097564697, -1.0674676895141602, -0.8813608884811401, -0.6952540278434753, -0.5091471672058105, -0.3230403661727905, -0.13693350553512573, 0.04917335510253906, 0.23528015613555908, 0.42138707637786865, 0.6074938774108887, 0.7936007380485535, 0.9797075986862183, 1.1658143997192383, 1.3519213199615479, 1.5380281209945679, 1.724134922027588, 1.9102418422698975, 2.096348762512207, 2.2824556827545166, 2.468562364578247, 2.6546692848205566, 2.840776205062866, 3.026883125305176, 3.2129898071289062, 3.399096727371216, 3.5852034091949463, 3.771310329437256, 3.9574170112609863, 4.143524169921875, 4.3296308517456055, 4.515737533569336, 4.701844215393066, 4.887951374053955, 5.0740580558776855, 5.260164737701416, 5.446271896362305, 5.632378578186035, 5.818485260009766, 6.004592418670654, 6.190699100494385, 6.376806259155273, 6.562912940979004]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 5.0, 3.0, 13.0, 17.0, 20.0, 26.0, 47.0, 71.0, 122.0, 177.0, 334.0, 530.0, 896.0, 1571.0, 2752.0, 5146.0, 9487.0, 17565.0, 32729.0, 60600.0, 111705.0, 207807.0, 267520.0, 150847.0, 82172.0, 44268.0, 23792.0, 12760.0, 6780.0, 3816.0, 2066.0, 1214.0, 677.0, 366.0, 263.0, 143.0, 98.0, 49.0, 38.0, 16.0, 17.0, 13.0, 6.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.587890625, -2.50762939453125, -2.4273681640625, -2.34710693359375, -2.266845703125, -2.18658447265625, -2.1063232421875, -2.02606201171875, -1.94580078125, -1.86553955078125, -1.7852783203125, -1.70501708984375, -1.624755859375, -1.54449462890625, -1.4642333984375, -1.38397216796875, -1.3037109375, -1.22344970703125, -1.1431884765625, -1.06292724609375, -0.982666015625, -0.90240478515625, -0.8221435546875, -0.74188232421875, -0.66162109375, -0.58135986328125, -0.5010986328125, -0.42083740234375, -0.340576171875, -0.26031494140625, -0.1800537109375, -0.09979248046875, -0.01953125, 0.06072998046875, 0.1409912109375, 0.22125244140625, 0.301513671875, 0.38177490234375, 0.4620361328125, 0.54229736328125, 0.62255859375, 0.70281982421875, 0.7830810546875, 0.86334228515625, 0.943603515625, 1.02386474609375, 1.1041259765625, 1.18438720703125, 1.2646484375, 1.34490966796875, 1.4251708984375, 1.50543212890625, 1.585693359375, 1.66595458984375, 1.7462158203125, 1.82647705078125, 1.90673828125, 1.98699951171875, 2.0672607421875, 2.14752197265625, 2.227783203125, 2.30804443359375, 2.3883056640625, 2.46856689453125, 2.548828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 9.0, 4.0, 9.0, 7.0, 12.0, 19.0, 22.0, 36.0, 32.0, 47.0, 58.0, 49.0, 56.0, 53.0, 58.0, 56.0, 68.0, 53.0, 53.0, 51.0, 46.0, 36.0, 42.0, 34.0, 26.0, 16.0, 16.0, 14.0, 9.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82080078125, -0.7954635620117188, -0.7701263427734375, -0.7447891235351562, -0.719451904296875, -0.6941146850585938, -0.6687774658203125, -0.6434402465820312, -0.61810302734375, -0.5927658081054688, -0.5674285888671875, -0.5420913696289062, -0.516754150390625, -0.49141693115234375, -0.4660797119140625, -0.44074249267578125, -0.4154052734375, -0.39006805419921875, -0.3647308349609375, -0.33939361572265625, -0.314056396484375, -0.28871917724609375, -0.2633819580078125, -0.23804473876953125, -0.21270751953125, -0.18737030029296875, -0.1620330810546875, -0.13669586181640625, -0.111358642578125, -0.08602142333984375, -0.0606842041015625, -0.03534698486328125, -0.010009765625, 0.01532745361328125, 0.0406646728515625, 0.06600189208984375, 0.091339111328125, 0.11667633056640625, 0.1420135498046875, 0.16735076904296875, 0.19268798828125, 0.21802520751953125, 0.2433624267578125, 0.26869964599609375, 0.294036865234375, 0.31937408447265625, 0.3447113037109375, 0.37004852294921875, 0.3953857421875, 0.42072296142578125, 0.4460601806640625, 0.47139739990234375, 0.496734619140625, 0.5220718383789062, 0.5474090576171875, 0.5727462768554688, 0.59808349609375, 0.6234207153320312, 0.6487579345703125, 0.6740951538085938, 0.699432373046875, 0.7247695922851562, 0.7501068115234375, 0.7754440307617188, 0.80078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 20.0, 22.0, 25.0, 38.0, 74.0, 122.0, 229.0, 546.0, 1529.0, 9175.0, 142667.0, 795326.0, 90043.0, 6557.0, 1280.0, 420.0, 175.0, 112.0, 72.0, 38.0, 22.0, 19.0, 9.0, 6.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -11.077880859375, -10.76513671875, -10.452392578125, -10.1396484375, -9.826904296875, -9.51416015625, -9.201416015625, -8.888671875, -8.575927734375, -8.26318359375, -7.950439453125, -7.6376953125, -7.324951171875, -7.01220703125, -6.699462890625, -6.38671875, -6.073974609375, -5.76123046875, -5.448486328125, -5.1357421875, -4.822998046875, -4.51025390625, -4.197509765625, -3.884765625, -3.572021484375, -3.25927734375, -2.946533203125, -2.6337890625, -2.321044921875, -2.00830078125, -1.695556640625, -1.3828125, -1.070068359375, -0.75732421875, -0.444580078125, -0.1318359375, 0.180908203125, 0.49365234375, 0.806396484375, 1.119140625, 1.431884765625, 1.74462890625, 2.057373046875, 2.3701171875, 2.682861328125, 2.99560546875, 3.308349609375, 3.62109375, 3.933837890625, 4.24658203125, 4.559326171875, 4.8720703125, 5.184814453125, 5.49755859375, 5.810302734375, 6.123046875, 6.435791015625, 6.74853515625, 7.061279296875, 7.3740234375, 7.686767578125, 7.99951171875, 8.312255859375, 8.625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 11.0, 9.0, 17.0, 16.0, 29.0, 18.0, 24.0, 32.0, 40.0, 36.0, 22.0, 32.0, 43.0, 43.0, 51.0, 54.0, 53.0, 50.0, 50.0, 37.0, 37.0, 31.0, 41.0, 35.0, 28.0, 16.0, 20.0, 21.0, 24.0, 14.0, 15.0, 9.0, 3.0, 1.0, 8.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.099609375, -3.00634765625, -2.9130859375, -2.81982421875, -2.7265625, -2.63330078125, -2.5400390625, -2.44677734375, -2.353515625, -2.26025390625, -2.1669921875, -2.07373046875, -1.98046875, -1.88720703125, -1.7939453125, -1.70068359375, -1.607421875, -1.51416015625, -1.4208984375, -1.32763671875, -1.234375, -1.14111328125, -1.0478515625, -0.95458984375, -0.861328125, -0.76806640625, -0.6748046875, -0.58154296875, -0.48828125, -0.39501953125, -0.3017578125, -0.20849609375, -0.115234375, -0.02197265625, 0.0712890625, 0.16455078125, 0.2578125, 0.35107421875, 0.4443359375, 0.53759765625, 0.630859375, 0.72412109375, 0.8173828125, 0.91064453125, 1.00390625, 1.09716796875, 1.1904296875, 1.28369140625, 1.376953125, 1.47021484375, 1.5634765625, 1.65673828125, 1.75, 1.84326171875, 1.9365234375, 2.02978515625, 2.123046875, 2.21630859375, 2.3095703125, 2.40283203125, 2.49609375, 2.58935546875, 2.6826171875, 2.77587890625, 2.869140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 15.0, 16.0, 28.0, 58.0, 77.0, 136.0, 223.0, 376.0, 671.0, 1311.0, 2501.0, 5792.0, 14468.0, 45347.0, 217399.0, 598252.0, 113662.0, 29253.0, 10354.0, 4313.0, 1959.0, 972.0, 552.0, 305.0, 177.0, 110.0, 76.0, 45.0, 35.0, 22.0, 13.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.1806640625, -3.068359375, -2.9560546875, -2.84375, -2.7314453125, -2.619140625, -2.5068359375, -2.39453125, -2.2822265625, -2.169921875, -2.0576171875, -1.9453125, -1.8330078125, -1.720703125, -1.6083984375, -1.49609375, -1.3837890625, -1.271484375, -1.1591796875, -1.046875, -0.9345703125, -0.822265625, -0.7099609375, -0.59765625, -0.4853515625, -0.373046875, -0.2607421875, -0.1484375, -0.0361328125, 0.076171875, 0.1884765625, 0.30078125, 0.4130859375, 0.525390625, 0.6376953125, 0.75, 0.8623046875, 0.974609375, 1.0869140625, 1.19921875, 1.3115234375, 1.423828125, 1.5361328125, 1.6484375, 1.7607421875, 1.873046875, 1.9853515625, 2.09765625, 2.2099609375, 2.322265625, 2.4345703125, 2.546875, 2.6591796875, 2.771484375, 2.8837890625, 2.99609375, 3.1083984375, 3.220703125, 3.3330078125, 3.4453125, 3.5576171875, 3.669921875, 3.7822265625, 3.89453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 15.0, 13.0, 18.0, 31.0, 50.0, 56.0, 110.0, 209.0, 225.0, 96.0, 47.0, 34.0, 27.0, 17.0, 11.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008115768432617188, -0.0007814615964889526, -0.0007513463497161865, -0.0007212311029434204, -0.0006911158561706543, -0.0006610006093978882, -0.0006308853626251221, -0.000600770115852356, -0.0005706548690795898, -0.0005405396223068237, -0.0005104243755340576, -0.0004803091287612915, -0.0004501938819885254, -0.0004200786352157593, -0.00038996338844299316, -0.00035984814167022705, -0.00032973289489746094, -0.0002996176481246948, -0.0002695024013519287, -0.0002393871545791626, -0.00020927190780639648, -0.00017915666103363037, -0.00014904141426086426, -0.00011892616748809814, -8.881092071533203e-05, -5.869567394256592e-05, -2.8580427169799805e-05, 1.5348196029663086e-06, 3.165006637573242e-05, 6.176531314849854e-05, 9.188055992126465e-05, 0.00012199580669403076, 0.00015211105346679688, 0.000182226300239563, 0.0002123415470123291, 0.00024245679378509521, 0.00027257204055786133, 0.00030268728733062744, 0.00033280253410339355, 0.00036291778087615967, 0.0003930330276489258, 0.0004231482744216919, 0.000453263521194458, 0.0004833787679672241, 0.0005134940147399902, 0.0005436092615127563, 0.0005737245082855225, 0.0006038397550582886, 0.0006339550018310547, 0.0006640702486038208, 0.0006941854953765869, 0.000724300742149353, 0.0007544159889221191, 0.0007845312356948853, 0.0008146464824676514, 0.0008447617292404175, 0.0008748769760131836, 0.0009049922227859497, 0.0009351074695587158, 0.0009652227163314819, 0.000995337963104248, 0.0010254532098770142, 0.0010555684566497803, 0.0010856837034225464, 0.0011157989501953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 14.0, 11.0, 12.0, 28.0, 57.0, 75.0, 139.0, 258.0, 574.0, 1313.0, 3851.0, 13252.0, 62585.0, 696925.0, 228228.0, 29704.0, 7481.0, 2344.0, 825.0, 367.0, 203.0, 132.0, 51.0, 44.0, 28.0, 16.0, 10.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.09808349609375, -5.9227294921875, -5.74737548828125, -5.572021484375, -5.39666748046875, -5.2213134765625, -5.04595947265625, -4.87060546875, -4.69525146484375, -4.5198974609375, -4.34454345703125, -4.169189453125, -3.99383544921875, -3.8184814453125, -3.64312744140625, -3.4677734375, -3.29241943359375, -3.1170654296875, -2.94171142578125, -2.766357421875, -2.59100341796875, -2.4156494140625, -2.24029541015625, -2.06494140625, -1.88958740234375, -1.7142333984375, -1.53887939453125, -1.363525390625, -1.18817138671875, -1.0128173828125, -0.83746337890625, -0.662109375, -0.48675537109375, -0.3114013671875, -0.13604736328125, 0.039306640625, 0.21466064453125, 0.3900146484375, 0.56536865234375, 0.74072265625, 0.91607666015625, 1.0914306640625, 1.26678466796875, 1.442138671875, 1.61749267578125, 1.7928466796875, 1.96820068359375, 2.1435546875, 2.31890869140625, 2.4942626953125, 2.66961669921875, 2.844970703125, 3.02032470703125, 3.1956787109375, 3.37103271484375, 3.54638671875, 3.72174072265625, 3.8970947265625, 4.07244873046875, 4.247802734375, 4.42315673828125, 4.5985107421875, 4.77386474609375, 4.94921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 12.0, 9.0, 15.0, 19.0, 36.0, 43.0, 72.0, 117.0, 156.0, 171.0, 100.0, 64.0, 43.0, 22.0, 20.0, 21.0, 14.0, 8.0, 8.0, 4.0, 4.0, 4.0, 6.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-3.76953125, -3.667205810546875, -3.56488037109375, -3.462554931640625, -3.3602294921875, -3.257904052734375, -3.15557861328125, -3.053253173828125, -2.950927734375, -2.848602294921875, -2.74627685546875, -2.643951416015625, -2.5416259765625, -2.439300537109375, -2.33697509765625, -2.234649658203125, -2.13232421875, -2.029998779296875, -1.92767333984375, -1.825347900390625, -1.7230224609375, -1.620697021484375, -1.51837158203125, -1.416046142578125, -1.313720703125, -1.211395263671875, -1.10906982421875, -1.006744384765625, -0.9044189453125, -0.802093505859375, -0.69976806640625, -0.597442626953125, -0.4951171875, -0.392791748046875, -0.29046630859375, -0.188140869140625, -0.0858154296875, 0.016510009765625, 0.11883544921875, 0.221160888671875, 0.323486328125, 0.425811767578125, 0.52813720703125, 0.630462646484375, 0.7327880859375, 0.835113525390625, 0.93743896484375, 1.039764404296875, 1.14208984375, 1.244415283203125, 1.34674072265625, 1.449066162109375, 1.5513916015625, 1.653717041015625, 1.75604248046875, 1.858367919921875, 1.960693359375, 2.063018798828125, 2.16534423828125, 2.267669677734375, 2.3699951171875, 2.472320556640625, 2.57464599609375, 2.676971435546875, 2.779296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 22.0, 61.0, 74.0, 114.0, 161.0, 170.0, 154.0, 86.0, 67.0, 44.0, 11.0, 12.0, 8.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.995370864868164, -30.62091827392578, -29.246463775634766, -27.872011184692383, -26.497556686401367, -25.123104095458984, -23.74864959716797, -22.374197006225586, -20.999744415283203, -19.62529182434082, -18.250837326049805, -16.876384735107422, -15.501930236816406, -14.127477645874023, -12.753024101257324, -11.378570556640625, -10.00411605834961, -8.62966251373291, -7.255208969116211, -5.88075590133667, -4.506302356719971, -3.1318488121032715, -1.7573957443237305, -0.38294219970703125, 0.991511344909668, 2.365964889526367, 3.7404181957244873, 5.114871501922607, 6.489325046539307, 7.863778591156006, 9.238231658935547, 10.612685203552246, 11.987140655517578, 13.361594200134277, 14.736047744750977, 16.11050033569336, 17.484954833984375, 18.859407424926758, 20.23386001586914, 21.608314514160156, 22.982769012451172, 24.357221603393555, 25.73167610168457, 27.106128692626953, 28.48058319091797, 29.85503578186035, 31.229488372802734, 32.60394287109375, 33.9783935546875, 35.352848052978516, 36.727298736572266, 38.10175323486328, 39.4762077331543, 40.85066223144531, 42.22511291503906, 43.59956741333008, 44.974021911621094, 46.34847640991211, 47.72292709350586, 49.097381591796875, 50.47183609008789, 51.846290588378906, 53.220741271972656, 54.59519577026367, 55.96965026855469]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 11.0, 15.0, 20.0, 21.0, 22.0, 24.0, 26.0, 34.0, 30.0, 42.0, 47.0, 45.0, 47.0, 43.0, 61.0, 49.0, 47.0, 44.0, 53.0, 40.0, 40.0, 32.0, 39.0, 35.0, 15.0, 16.0, 27.0, 15.0, 13.0, 7.0, 8.0, 4.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.719343185424805, -17.106679916381836, -16.494016647338867, -15.881353378295898, -15.26869010925293, -14.656026840209961, -14.043363571166992, -13.430700302124023, -12.818037033081055, -12.205373764038086, -11.592710494995117, -10.980047225952148, -10.36738395690918, -9.754720687866211, -9.142057418823242, -8.529394149780273, -7.916730880737305, -7.304067611694336, -6.691404342651367, -6.078741073608398, -5.46607780456543, -4.853414535522461, -4.240751266479492, -3.6280879974365234, -3.0154247283935547, -2.402761459350586, -1.7900981903076172, -1.1774349212646484, -0.5647716522216797, 0.04789161682128906, 0.6605548858642578, 1.2732181549072266, 1.8858795166015625, 2.4985427856445312, 3.1112060546875, 3.7238693237304688, 4.3365325927734375, 4.949195861816406, 5.561859130859375, 6.174522399902344, 6.7871856689453125, 7.399848937988281, 8.01251220703125, 8.625175476074219, 9.237838745117188, 9.850502014160156, 10.463165283203125, 11.075828552246094, 11.688491821289062, 12.301155090332031, 12.913818359375, 13.526481628417969, 14.139144897460938, 14.751808166503906, 15.364471435546875, 15.977134704589844, 16.589797973632812, 17.20246124267578, 17.81512451171875, 18.42778778076172, 19.040451049804688, 19.653114318847656, 20.265777587890625, 20.878440856933594, 21.491104125976562]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 0.0, 9.0, 6.0, 7.0, 11.0, 21.0, 29.0, 42.0, 63.0, 95.0, 150.0, 276.0, 392.0, 729.0, 1271.0, 2528.0, 4877.0, 10789.0, 26067.0, 75473.0, 307600.0, 3224878.0, 397560.0, 88200.0, 29897.0, 11971.0, 5455.0, 2698.0, 1381.0, 739.0, 445.0, 240.0, 152.0, 81.0, 43.0, 40.0, 21.0, 20.0, 7.0, 7.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.9453125, -3.834381103515625, -3.72344970703125, -3.612518310546875, -3.5015869140625, -3.390655517578125, -3.27972412109375, -3.168792724609375, -3.057861328125, -2.946929931640625, -2.83599853515625, -2.725067138671875, -2.6141357421875, -2.503204345703125, -2.39227294921875, -2.281341552734375, -2.17041015625, -2.059478759765625, -1.94854736328125, -1.837615966796875, -1.7266845703125, -1.615753173828125, -1.50482177734375, -1.393890380859375, -1.282958984375, -1.172027587890625, -1.06109619140625, -0.950164794921875, -0.8392333984375, -0.728302001953125, -0.61737060546875, -0.506439208984375, -0.3955078125, -0.284576416015625, -0.17364501953125, -0.062713623046875, 0.0482177734375, 0.159149169921875, 0.27008056640625, 0.381011962890625, 0.491943359375, 0.602874755859375, 0.71380615234375, 0.824737548828125, 0.9356689453125, 1.046600341796875, 1.15753173828125, 1.268463134765625, 1.37939453125, 1.490325927734375, 1.60125732421875, 1.712188720703125, 1.8231201171875, 1.934051513671875, 2.04498291015625, 2.155914306640625, 2.266845703125, 2.377777099609375, 2.48870849609375, 2.599639892578125, 2.7105712890625, 2.821502685546875, 2.93243408203125, 3.043365478515625, 3.154296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 9.0, 6.0, 9.0, 8.0, 12.0, 33.0, 14.0, 35.0, 44.0, 39.0, 43.0, 74.0, 50.0, 63.0, 65.0, 58.0, 58.0, 60.0, 50.0, 41.0, 49.0, 40.0, 27.0, 20.0, 25.0, 15.0, 14.0, 9.0, 6.0, 5.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.994140625, -0.9664154052734375, -0.938690185546875, -0.9109649658203125, -0.88323974609375, -0.8555145263671875, -0.827789306640625, -0.8000640869140625, -0.7723388671875, -0.7446136474609375, -0.716888427734375, -0.6891632080078125, -0.66143798828125, -0.6337127685546875, -0.605987548828125, -0.5782623291015625, -0.550537109375, -0.5228118896484375, -0.495086669921875, -0.4673614501953125, -0.43963623046875, -0.4119110107421875, -0.384185791015625, -0.3564605712890625, -0.3287353515625, -0.3010101318359375, -0.273284912109375, -0.2455596923828125, -0.21783447265625, -0.1901092529296875, -0.162384033203125, -0.1346588134765625, -0.10693359375, -0.0792083740234375, -0.051483154296875, -0.0237579345703125, 0.00396728515625, 0.0316925048828125, 0.059417724609375, 0.0871429443359375, 0.1148681640625, 0.1425933837890625, 0.170318603515625, 0.1980438232421875, 0.22576904296875, 0.2534942626953125, 0.281219482421875, 0.3089447021484375, 0.336669921875, 0.3643951416015625, 0.392120361328125, 0.4198455810546875, 0.44757080078125, 0.4752960205078125, 0.503021240234375, 0.5307464599609375, 0.5584716796875, 0.5861968994140625, 0.613922119140625, 0.6416473388671875, 0.66937255859375, 0.6970977783203125, 0.724822998046875, 0.7525482177734375, 0.7802734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 6.0, 5.0, 14.0, 12.0, 20.0, 19.0, 33.0, 50.0, 72.0, 105.0, 166.0, 242.0, 318.0, 581.0, 864.0, 1536.0, 2635.0, 4954.0, 9238.0, 18621.0, 39799.0, 101385.0, 337055.0, 2589875.0, 799047.0, 170995.0, 61911.0, 26410.0, 12708.0, 6629.0, 3500.0, 2067.0, 1257.0, 750.0, 478.0, 310.0, 207.0, 129.0, 90.0, 56.0, 47.0, 34.0, 22.0, 9.0, 13.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.814453125, -2.722900390625, -2.63134765625, -2.539794921875, -2.4482421875, -2.356689453125, -2.26513671875, -2.173583984375, -2.08203125, -1.990478515625, -1.89892578125, -1.807373046875, -1.7158203125, -1.624267578125, -1.53271484375, -1.441162109375, -1.349609375, -1.258056640625, -1.16650390625, -1.074951171875, -0.9833984375, -0.891845703125, -0.80029296875, -0.708740234375, -0.6171875, -0.525634765625, -0.43408203125, -0.342529296875, -0.2509765625, -0.159423828125, -0.06787109375, 0.023681640625, 0.115234375, 0.206787109375, 0.29833984375, 0.389892578125, 0.4814453125, 0.572998046875, 0.66455078125, 0.756103515625, 0.84765625, 0.939208984375, 1.03076171875, 1.122314453125, 1.2138671875, 1.305419921875, 1.39697265625, 1.488525390625, 1.580078125, 1.671630859375, 1.76318359375, 1.854736328125, 1.9462890625, 2.037841796875, 2.12939453125, 2.220947265625, 2.3125, 2.404052734375, 2.49560546875, 2.587158203125, 2.6787109375, 2.770263671875, 2.86181640625, 2.953369140625, 3.044921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 18.0, 8.0, 19.0, 24.0, 22.0, 48.0, 49.0, 80.0, 135.0, 208.0, 387.0, 1136.0, 992.0, 352.0, 175.0, 120.0, 89.0, 54.0, 42.0, 25.0, 16.0, 16.0, 10.0, 7.0, 9.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5849609375, -1.5214691162109375, -1.457977294921875, -1.3944854736328125, -1.33099365234375, -1.2675018310546875, -1.204010009765625, -1.1405181884765625, -1.0770263671875, -1.0135345458984375, -0.950042724609375, -0.8865509033203125, -0.82305908203125, -0.7595672607421875, -0.696075439453125, -0.6325836181640625, -0.569091796875, -0.5055999755859375, -0.442108154296875, -0.3786163330078125, -0.31512451171875, -0.2516326904296875, -0.188140869140625, -0.1246490478515625, -0.0611572265625, 0.0023345947265625, 0.065826416015625, 0.1293182373046875, 0.19281005859375, 0.2563018798828125, 0.319793701171875, 0.3832855224609375, 0.44677734375, 0.5102691650390625, 0.573760986328125, 0.6372528076171875, 0.70074462890625, 0.7642364501953125, 0.827728271484375, 0.8912200927734375, 0.9547119140625, 1.0182037353515625, 1.081695556640625, 1.1451873779296875, 1.20867919921875, 1.2721710205078125, 1.335662841796875, 1.3991546630859375, 1.462646484375, 1.5261383056640625, 1.589630126953125, 1.6531219482421875, 1.71661376953125, 1.7801055908203125, 1.843597412109375, 1.9070892333984375, 1.9705810546875, 2.0340728759765625, 2.097564697265625, 2.1610565185546875, 2.22454833984375, 2.2880401611328125, 2.351531982421875, 2.4150238037109375, 2.478515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 8.0, 7.0, 16.0, 29.0, 25.0, 47.0, 65.0, 132.0, 132.0, 126.0, 118.0, 98.0, 71.0, 40.0, 38.0, 20.0, 12.0, 11.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.026500701904297, -19.574810028076172, -19.123119354248047, -18.671428680419922, -18.219738006591797, -17.768047332763672, -17.316356658935547, -16.864665985107422, -16.412975311279297, -15.961284637451172, -15.509593963623047, -15.057903289794922, -14.606212615966797, -14.154521942138672, -13.702831268310547, -13.251140594482422, -12.799449920654297, -12.347759246826172, -11.896068572998047, -11.444377899169922, -10.992687225341797, -10.540996551513672, -10.089305877685547, -9.637615203857422, -9.185924530029297, -8.734233856201172, -8.282543182373047, -7.830852508544922, -7.379161834716797, -6.927471160888672, -6.475780487060547, -6.024089813232422, -5.572399139404297, -5.120708465576172, -4.669017791748047, -4.217327117919922, -3.765636444091797, -3.313945770263672, -2.862255096435547, -2.410564422607422, -1.9588737487792969, -1.5071830749511719, -1.0554924011230469, -0.6038017272949219, -0.15211105346679688, 0.2995796203613281, 0.7512702941894531, 1.2029609680175781, 1.6546516418457031, 2.106342315673828, 2.558032989501953, 3.009723663330078, 3.461414337158203, 3.913105010986328, 4.364795684814453, 4.816486358642578, 5.268177032470703, 5.719867706298828, 6.171558380126953, 6.623249053955078, 7.074939727783203, 7.526630401611328, 7.978321075439453, 8.430011749267578, 8.881702423095703]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 8.0, 15.0, 22.0, 16.0, 25.0, 23.0, 29.0, 50.0, 31.0, 51.0, 58.0, 54.0, 53.0, 43.0, 49.0, 56.0, 44.0, 45.0, 45.0, 33.0, 45.0, 31.0, 28.0, 19.0, 24.0, 16.0, 20.0, 12.0, 13.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.392812728881836, -9.133866310119629, -8.874920845031738, -8.615974426269531, -8.35702896118164, -8.098082542419434, -7.839136600494385, -7.580190658569336, -7.321244716644287, -7.062298774719238, -6.8033528327941895, -6.544406890869141, -6.285460472106934, -6.026515007019043, -5.767568588256836, -5.508622646331787, -5.249676704406738, -4.9907307624816895, -4.731784820556641, -4.472838878631592, -4.213892936706543, -3.954946756362915, -3.696000576019287, -3.4370546340942383, -3.1781086921691895, -2.9191627502441406, -2.660216808319092, -2.401270627975464, -2.142324686050415, -1.8833787441253662, -1.6244326829910278, -1.3654866218566895, -1.106541633605957, -0.8475956320762634, -0.5886496305465698, -0.3297036290168762, -0.07075762748718262, 0.1881883144378662, 0.4471343755722046, 0.706080436706543, 0.9650263786315918, 1.2239723205566406, 1.482918381690979, 1.7418644428253174, 2.000810384750366, 2.259756326675415, 2.518702507019043, 2.777648448944092, 3.0365943908691406, 3.2955403327941895, 3.5544862747192383, 3.813432455062866, 4.072378158569336, 4.331324577331543, 4.590270519256592, 4.849216461181641, 5.1081624031066895, 5.367108345031738, 5.626054286956787, 5.885000228881836, 6.143946647644043, 6.402892112731934, 6.661838531494141, 6.9207844734191895, 7.179730415344238]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 7.0, 6.0, 6.0, 11.0, 21.0, 33.0, 47.0, 85.0, 146.0, 195.0, 327.0, 525.0, 845.0, 1473.0, 2755.0, 4791.0, 8614.0, 15775.0, 29080.0, 57851.0, 136827.0, 418784.0, 211680.0, 77024.0, 37376.0, 19822.0, 10666.0, 6007.0, 3274.0, 1824.0, 1066.0, 657.0, 365.0, 212.0, 116.0, 93.0, 52.0, 35.0, 23.0, 9.0, 12.0, 14.0, 7.0, 6.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.359375, -3.26251220703125, -3.1656494140625, -3.06878662109375, -2.971923828125, -2.87506103515625, -2.7781982421875, -2.68133544921875, -2.58447265625, -2.48760986328125, -2.3907470703125, -2.29388427734375, -2.197021484375, -2.10015869140625, -2.0032958984375, -1.90643310546875, -1.8095703125, -1.71270751953125, -1.6158447265625, -1.51898193359375, -1.422119140625, -1.32525634765625, -1.2283935546875, -1.13153076171875, -1.03466796875, -0.93780517578125, -0.8409423828125, -0.74407958984375, -0.647216796875, -0.55035400390625, -0.4534912109375, -0.35662841796875, -0.259765625, -0.16290283203125, -0.0660400390625, 0.03082275390625, 0.127685546875, 0.22454833984375, 0.3214111328125, 0.41827392578125, 0.51513671875, 0.61199951171875, 0.7088623046875, 0.80572509765625, 0.902587890625, 0.99945068359375, 1.0963134765625, 1.19317626953125, 1.2900390625, 1.38690185546875, 1.4837646484375, 1.58062744140625, 1.677490234375, 1.77435302734375, 1.8712158203125, 1.96807861328125, 2.06494140625, 2.16180419921875, 2.2586669921875, 2.35552978515625, 2.452392578125, 2.54925537109375, 2.6461181640625, 2.74298095703125, 2.83984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 9.0, 7.0, 12.0, 6.0, 13.0, 26.0, 26.0, 26.0, 33.0, 24.0, 43.0, 47.0, 55.0, 58.0, 52.0, 50.0, 58.0, 45.0, 53.0, 52.0, 43.0, 36.0, 45.0, 20.0, 36.0, 25.0, 16.0, 15.0, 9.0, 12.0, 10.0, 4.0, 9.0, 12.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8741455078125, -0.849853515625, -0.8255615234375, -0.80126953125, -0.7769775390625, -0.752685546875, -0.7283935546875, -0.7041015625, -0.6798095703125, -0.655517578125, -0.6312255859375, -0.60693359375, -0.5826416015625, -0.558349609375, -0.5340576171875, -0.509765625, -0.4854736328125, -0.461181640625, -0.4368896484375, -0.41259765625, -0.3883056640625, -0.364013671875, -0.3397216796875, -0.3154296875, -0.2911376953125, -0.266845703125, -0.2425537109375, -0.21826171875, -0.1939697265625, -0.169677734375, -0.1453857421875, -0.12109375, -0.0968017578125, -0.072509765625, -0.0482177734375, -0.02392578125, 0.0003662109375, 0.024658203125, 0.0489501953125, 0.0732421875, 0.0975341796875, 0.121826171875, 0.1461181640625, 0.17041015625, 0.1947021484375, 0.218994140625, 0.2432861328125, 0.267578125, 0.2918701171875, 0.316162109375, 0.3404541015625, 0.36474609375, 0.3890380859375, 0.413330078125, 0.4376220703125, 0.4619140625, 0.4862060546875, 0.510498046875, 0.5347900390625, 0.55908203125, 0.5833740234375, 0.607666015625, 0.6319580078125, 0.65625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 11.0, 13.0, 15.0, 22.0, 27.0, 43.0, 61.0, 105.0, 145.0, 256.0, 428.0, 842.0, 2659.0, 12497.0, 86865.0, 780327.0, 139419.0, 18812.0, 3619.0, 1110.0, 483.0, 264.0, 177.0, 115.0, 59.0, 58.0, 21.0, 22.0, 14.0, 20.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.2578125, -8.99029541015625, -8.7227783203125, -8.45526123046875, -8.187744140625, -7.92022705078125, -7.6527099609375, -7.38519287109375, -7.11767578125, -6.85015869140625, -6.5826416015625, -6.31512451171875, -6.047607421875, -5.78009033203125, -5.5125732421875, -5.24505615234375, -4.9775390625, -4.71002197265625, -4.4425048828125, -4.17498779296875, -3.907470703125, -3.63995361328125, -3.3724365234375, -3.10491943359375, -2.83740234375, -2.56988525390625, -2.3023681640625, -2.03485107421875, -1.767333984375, -1.49981689453125, -1.2322998046875, -0.96478271484375, -0.697265625, -0.42974853515625, -0.1622314453125, 0.10528564453125, 0.372802734375, 0.64031982421875, 0.9078369140625, 1.17535400390625, 1.44287109375, 1.71038818359375, 1.9779052734375, 2.24542236328125, 2.512939453125, 2.78045654296875, 3.0479736328125, 3.31549072265625, 3.5830078125, 3.85052490234375, 4.1180419921875, 4.38555908203125, 4.653076171875, 4.92059326171875, 5.1881103515625, 5.45562744140625, 5.72314453125, 5.99066162109375, 6.2581787109375, 6.52569580078125, 6.793212890625, 7.06072998046875, 7.3282470703125, 7.59576416015625, 7.86328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 17.0, 12.0, 11.0, 16.0, 12.0, 20.0, 25.0, 28.0, 26.0, 36.0, 39.0, 37.0, 51.0, 49.0, 47.0, 52.0, 45.0, 57.0, 53.0, 42.0, 41.0, 39.0, 38.0, 33.0, 23.0, 28.0, 24.0, 22.0, 9.0, 12.0, 7.0, 10.0, 3.0, 5.0, 3.0, 5.0, 3.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.572265625, -3.463409423828125, -3.35455322265625, -3.245697021484375, -3.1368408203125, -3.027984619140625, -2.91912841796875, -2.810272216796875, -2.701416015625, -2.592559814453125, -2.48370361328125, -2.374847412109375, -2.2659912109375, -2.157135009765625, -2.04827880859375, -1.939422607421875, -1.83056640625, -1.721710205078125, -1.61285400390625, -1.503997802734375, -1.3951416015625, -1.286285400390625, -1.17742919921875, -1.068572998046875, -0.959716796875, -0.850860595703125, -0.74200439453125, -0.633148193359375, -0.5242919921875, -0.415435791015625, -0.30657958984375, -0.197723388671875, -0.0888671875, 0.019989013671875, 0.12884521484375, 0.237701416015625, 0.3465576171875, 0.455413818359375, 0.56427001953125, 0.673126220703125, 0.781982421875, 0.890838623046875, 0.99969482421875, 1.108551025390625, 1.2174072265625, 1.326263427734375, 1.43511962890625, 1.543975830078125, 1.65283203125, 1.761688232421875, 1.87054443359375, 1.979400634765625, 2.0882568359375, 2.197113037109375, 2.30596923828125, 2.414825439453125, 2.523681640625, 2.632537841796875, 2.74139404296875, 2.850250244140625, 2.9591064453125, 3.067962646484375, 3.17681884765625, 3.285675048828125, 3.39453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 9.0, 9.0, 12.0, 8.0, 19.0, 14.0, 22.0, 35.0, 51.0, 65.0, 117.0, 226.0, 438.0, 835.0, 2065.0, 5863.0, 21369.0, 105855.0, 800512.0, 84536.0, 17819.0, 5103.0, 1811.0, 819.0, 364.0, 214.0, 118.0, 73.0, 38.0, 39.0, 18.0, 18.0, 10.0, 9.0, 6.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-5.91015625, -5.7333984375, -5.556640625, -5.3798828125, -5.203125, -5.0263671875, -4.849609375, -4.6728515625, -4.49609375, -4.3193359375, -4.142578125, -3.9658203125, -3.7890625, -3.6123046875, -3.435546875, -3.2587890625, -3.08203125, -2.9052734375, -2.728515625, -2.5517578125, -2.375, -2.1982421875, -2.021484375, -1.8447265625, -1.66796875, -1.4912109375, -1.314453125, -1.1376953125, -0.9609375, -0.7841796875, -0.607421875, -0.4306640625, -0.25390625, -0.0771484375, 0.099609375, 0.2763671875, 0.453125, 0.6298828125, 0.806640625, 0.9833984375, 1.16015625, 1.3369140625, 1.513671875, 1.6904296875, 1.8671875, 2.0439453125, 2.220703125, 2.3974609375, 2.57421875, 2.7509765625, 2.927734375, 3.1044921875, 3.28125, 3.4580078125, 3.634765625, 3.8115234375, 3.98828125, 4.1650390625, 4.341796875, 4.5185546875, 4.6953125, 4.8720703125, 5.048828125, 5.2255859375, 5.40234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 14.0, 20.0, 18.0, 33.0, 47.0, 88.0, 408.0, 155.0, 52.0, 26.0, 30.0, 19.0, 18.0, 13.0, 13.0, 11.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011806488037109375, -0.001145586371421814, -0.0011105239391326904, -0.001075461506843567, -0.0010403990745544434, -0.0010053366422653198, -0.0009702742099761963, -0.0009352117776870728, -0.0009001493453979492, -0.0008650869131088257, -0.0008300244808197021, -0.0007949620485305786, -0.0007598996162414551, -0.0007248371839523315, -0.000689774751663208, -0.0006547123193740845, -0.0006196498870849609, -0.0005845874547958374, -0.0005495250225067139, -0.0005144625902175903, -0.0004794001579284668, -0.00044433772563934326, -0.0004092752933502197, -0.0003742128610610962, -0.00033915042877197266, -0.0003040879964828491, -0.0002690255641937256, -0.00023396313190460205, -0.00019890069961547852, -0.00016383826732635498, -0.00012877583503723145, -9.371340274810791e-05, -5.8650970458984375e-05, -2.358853816986084e-05, 1.1473894119262695e-05, 4.653632640838623e-05, 8.159875869750977e-05, 0.0001166611909866333, 0.00015172362327575684, 0.00018678605556488037, 0.0002218484878540039, 0.00025691092014312744, 0.000291973352432251, 0.0003270357847213745, 0.00036209821701049805, 0.0003971606492996216, 0.0004322230815887451, 0.00046728551387786865, 0.0005023479461669922, 0.0005374103784561157, 0.0005724728107452393, 0.0006075352430343628, 0.0006425976753234863, 0.0006776601076126099, 0.0007127225399017334, 0.0007477849721908569, 0.0007828474044799805, 0.000817909836769104, 0.0008529722690582275, 0.0008880347013473511, 0.0009230971336364746, 0.0009581595659255981, 0.0009932219982147217, 0.0010282844305038452, 0.0010633468627929688]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 2.0, 8.0, 6.0, 8.0, 12.0, 16.0, 17.0, 33.0, 61.0, 117.0, 252.0, 589.0, 1775.0, 7691.0, 68640.0, 901735.0, 58036.0, 6786.0, 1657.0, 589.0, 226.0, 106.0, 65.0, 46.0, 20.0, 15.0, 10.0, 13.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0390625, -9.747802734375, -9.45654296875, -9.165283203125, -8.8740234375, -8.582763671875, -8.29150390625, -8.000244140625, -7.708984375, -7.417724609375, -7.12646484375, -6.835205078125, -6.5439453125, -6.252685546875, -5.96142578125, -5.670166015625, -5.37890625, -5.087646484375, -4.79638671875, -4.505126953125, -4.2138671875, -3.922607421875, -3.63134765625, -3.340087890625, -3.048828125, -2.757568359375, -2.46630859375, -2.175048828125, -1.8837890625, -1.592529296875, -1.30126953125, -1.010009765625, -0.71875, -0.427490234375, -0.13623046875, 0.155029296875, 0.4462890625, 0.737548828125, 1.02880859375, 1.320068359375, 1.611328125, 1.902587890625, 2.19384765625, 2.485107421875, 2.7763671875, 3.067626953125, 3.35888671875, 3.650146484375, 3.94140625, 4.232666015625, 4.52392578125, 4.815185546875, 5.1064453125, 5.397705078125, 5.68896484375, 5.980224609375, 6.271484375, 6.562744140625, 6.85400390625, 7.145263671875, 7.4365234375, 7.727783203125, 8.01904296875, 8.310302734375, 8.6015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 1.0, 4.0, 6.0, 14.0, 7.0, 11.0, 19.0, 19.0, 26.0, 35.0, 78.0, 250.0, 252.0, 96.0, 44.0, 23.0, 27.0, 19.0, 15.0, 13.0, 3.0, 4.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.030426025390625, -3.90460205078125, -3.778778076171875, -3.6529541015625, -3.527130126953125, -3.40130615234375, -3.275482177734375, -3.149658203125, -3.023834228515625, -2.89801025390625, -2.772186279296875, -2.6463623046875, -2.520538330078125, -2.39471435546875, -2.268890380859375, -2.14306640625, -2.017242431640625, -1.89141845703125, -1.765594482421875, -1.6397705078125, -1.513946533203125, -1.38812255859375, -1.262298583984375, -1.136474609375, -1.010650634765625, -0.88482666015625, -0.759002685546875, -0.6331787109375, -0.507354736328125, -0.38153076171875, -0.255706787109375, -0.1298828125, -0.004058837890625, 0.12176513671875, 0.247589111328125, 0.3734130859375, 0.499237060546875, 0.62506103515625, 0.750885009765625, 0.876708984375, 1.002532958984375, 1.12835693359375, 1.254180908203125, 1.3800048828125, 1.505828857421875, 1.63165283203125, 1.757476806640625, 1.88330078125, 2.009124755859375, 2.13494873046875, 2.260772705078125, 2.3865966796875, 2.512420654296875, 2.63824462890625, 2.764068603515625, 2.889892578125, 3.015716552734375, 3.14154052734375, 3.267364501953125, 3.3931884765625, 3.519012451171875, 3.64483642578125, 3.770660400390625, 3.896484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 14.0, 26.0, 55.0, 96.0, 154.0, 208.0, 187.0, 127.0, 85.0, 29.0, 14.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.09597778320312, -67.21365356445312, -65.33132934570312, -63.44900131225586, -61.56667709350586, -59.68435287475586, -57.80202865600586, -55.919700622558594, -54.037376403808594, -52.155052185058594, -50.272727966308594, -48.39039993286133, -46.50807571411133, -44.62575149536133, -42.74342727661133, -40.86109924316406, -38.97877502441406, -37.09645080566406, -35.21412658691406, -33.3317985534668, -31.449474334716797, -29.567150115966797, -27.684825897216797, -25.802499771118164, -23.920177459716797, -22.037853240966797, -20.155527114868164, -18.273202896118164, -16.39087677001953, -14.508552551269531, -12.626227378845215, -10.743902206420898, -8.861576080322266, -6.979250907897949, -5.096925735473633, -3.2146010398864746, -1.3322758674621582, 0.550048828125, 2.4323740005493164, 4.314699172973633, 6.197024345397949, 8.079349517822266, 9.961674690246582, 11.843999862670898, 13.726324081420898, 15.608649253845215, 17.49097442626953, 19.37329864501953, 21.255624771118164, 23.137948989868164, 25.020275115966797, 26.902599334716797, 28.78492546081543, 30.66724967956543, 32.54957580566406, 34.43190002441406, 36.31422424316406, 38.19654846191406, 40.07887268066406, 41.96120071411133, 43.84352493286133, 45.72584915161133, 47.60817337036133, 49.490501403808594, 51.372825622558594]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 9.0, 8.0, 20.0, 16.0, 24.0, 20.0, 35.0, 40.0, 38.0, 40.0, 44.0, 44.0, 47.0, 50.0, 51.0, 45.0, 46.0, 51.0, 37.0, 41.0, 33.0, 36.0, 39.0, 30.0, 31.0, 21.0, 24.0, 13.0, 14.0, 9.0, 10.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.753005981445312, -22.079782485961914, -21.406557083129883, -20.733333587646484, -20.060108184814453, -19.386884689331055, -18.713659286499023, -18.040435791015625, -17.367210388183594, -16.693986892700195, -16.020761489868164, -15.34753704071045, -14.674312591552734, -14.00108814239502, -13.327863693237305, -12.654640197753906, -11.981415748596191, -11.308191299438477, -10.634966850280762, -9.961742401123047, -9.288517951965332, -8.615293502807617, -7.9420695304870605, -7.268845081329346, -6.595620632171631, -5.922396183013916, -5.249171733856201, -4.5759477615356445, -3.9027230739593506, -3.2294986248016357, -2.5562744140625, -1.8830499649047852, -1.2098255157470703, -0.5366011261940002, 0.13662326335906982, 0.8098475933074951, 1.48307204246521, 2.156296491622925, 2.8295207023620605, 3.5027451515197754, 4.17596960067749, 4.849194049835205, 5.52241849899292, 6.195642471313477, 6.868866920471191, 7.542091369628906, 8.215315818786621, 8.888540267944336, 9.56176471710205, 10.234989166259766, 10.90821361541748, 11.581438064575195, 12.25466251373291, 12.927886962890625, 13.601110458374023, 14.274335861206055, 14.947559356689453, 15.620783805847168, 16.294008255004883, 16.96723175048828, 17.640457153320312, 18.31368064880371, 18.986906051635742, 19.66012954711914, 20.333354949951172]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 17.0, 25.0, 41.0, 97.0, 139.0, 182.0, 320.0, 653.0, 1388.0, 2784.0, 6860.0, 19455.0, 77051.0, 937951.0, 3003859.0, 104084.0, 24925.0, 8313.0, 3296.0, 1389.0, 700.0, 320.0, 162.0, 100.0, 51.0, 32.0, 19.0, 12.0, 8.0, 3.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6953125, -5.517822265625, -5.34033203125, -5.162841796875, -4.9853515625, -4.807861328125, -4.63037109375, -4.452880859375, -4.275390625, -4.097900390625, -3.92041015625, -3.742919921875, -3.5654296875, -3.387939453125, -3.21044921875, -3.032958984375, -2.85546875, -2.677978515625, -2.50048828125, -2.322998046875, -2.1455078125, -1.968017578125, -1.79052734375, -1.613037109375, -1.435546875, -1.258056640625, -1.08056640625, -0.903076171875, -0.7255859375, -0.548095703125, -0.37060546875, -0.193115234375, -0.015625, 0.161865234375, 0.33935546875, 0.516845703125, 0.6943359375, 0.871826171875, 1.04931640625, 1.226806640625, 1.404296875, 1.581787109375, 1.75927734375, 1.936767578125, 2.1142578125, 2.291748046875, 2.46923828125, 2.646728515625, 2.82421875, 3.001708984375, 3.17919921875, 3.356689453125, 3.5341796875, 3.711669921875, 3.88916015625, 4.066650390625, 4.244140625, 4.421630859375, 4.59912109375, 4.776611328125, 4.9541015625, 5.131591796875, 5.30908203125, 5.486572265625, 5.6640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 6.0, 5.0, 9.0, 8.0, 17.0, 19.0, 24.0, 21.0, 42.0, 34.0, 54.0, 28.0, 37.0, 41.0, 57.0, 41.0, 48.0, 50.0, 42.0, 46.0, 45.0, 45.0, 27.0, 42.0, 29.0, 29.0, 27.0, 20.0, 17.0, 14.0, 14.0, 11.0, 6.0, 9.0, 6.0, 2.0, 1.0, 5.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.9755859375, -0.9503326416015625, -0.925079345703125, -0.8998260498046875, -0.87457275390625, -0.8493194580078125, -0.824066162109375, -0.7988128662109375, -0.7735595703125, -0.7483062744140625, -0.723052978515625, -0.6977996826171875, -0.67254638671875, -0.6472930908203125, -0.622039794921875, -0.5967864990234375, -0.571533203125, -0.5462799072265625, -0.521026611328125, -0.4957733154296875, -0.47052001953125, -0.4452667236328125, -0.420013427734375, -0.3947601318359375, -0.3695068359375, -0.3442535400390625, -0.319000244140625, -0.2937469482421875, -0.26849365234375, -0.2432403564453125, -0.217987060546875, -0.1927337646484375, -0.16748046875, -0.1422271728515625, -0.116973876953125, -0.0917205810546875, -0.06646728515625, -0.0412139892578125, -0.015960693359375, 0.0092926025390625, 0.0345458984375, 0.0597991943359375, 0.085052490234375, 0.1103057861328125, 0.13555908203125, 0.1608123779296875, 0.186065673828125, 0.2113189697265625, 0.236572265625, 0.2618255615234375, 0.287078857421875, 0.3123321533203125, 0.33758544921875, 0.3628387451171875, 0.388092041015625, 0.4133453369140625, 0.4385986328125, 0.4638519287109375, 0.489105224609375, 0.5143585205078125, 0.53961181640625, 0.5648651123046875, 0.590118408203125, 0.6153717041015625, 0.640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 11.0, 17.0, 23.0, 14.0, 35.0, 40.0, 46.0, 98.0, 159.0, 330.0, 716.0, 2099.0, 6838.0, 30372.0, 279407.0, 3701187.0, 144071.0, 20848.0, 4976.0, 1612.0, 654.0, 257.0, 125.0, 66.0, 59.0, 31.0, 26.0, 26.0, 16.0, 17.0, 15.0, 19.0, 8.0, 5.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.3515625, -8.08544921875, -7.8193359375, -7.55322265625, -7.287109375, -7.02099609375, -6.7548828125, -6.48876953125, -6.22265625, -5.95654296875, -5.6904296875, -5.42431640625, -5.158203125, -4.89208984375, -4.6259765625, -4.35986328125, -4.09375, -3.82763671875, -3.5615234375, -3.29541015625, -3.029296875, -2.76318359375, -2.4970703125, -2.23095703125, -1.96484375, -1.69873046875, -1.4326171875, -1.16650390625, -0.900390625, -0.63427734375, -0.3681640625, -0.10205078125, 0.1640625, 0.43017578125, 0.6962890625, 0.96240234375, 1.228515625, 1.49462890625, 1.7607421875, 2.02685546875, 2.29296875, 2.55908203125, 2.8251953125, 3.09130859375, 3.357421875, 3.62353515625, 3.8896484375, 4.15576171875, 4.421875, 4.68798828125, 4.9541015625, 5.22021484375, 5.486328125, 5.75244140625, 6.0185546875, 6.28466796875, 6.55078125, 6.81689453125, 7.0830078125, 7.34912109375, 7.615234375, 7.88134765625, 8.1474609375, 8.41357421875, 8.6796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 8.0, 11.0, 11.0, 17.0, 29.0, 57.0, 116.0, 243.0, 807.0, 2003.0, 417.0, 175.0, 64.0, 44.0, 15.0, 25.0, 15.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.220703125, -2.111114501953125, -2.00152587890625, -1.891937255859375, -1.7823486328125, -1.672760009765625, -1.56317138671875, -1.453582763671875, -1.343994140625, -1.234405517578125, -1.12481689453125, -1.015228271484375, -0.9056396484375, -0.796051025390625, -0.68646240234375, -0.576873779296875, -0.46728515625, -0.357696533203125, -0.24810791015625, -0.138519287109375, -0.0289306640625, 0.080657958984375, 0.19024658203125, 0.299835205078125, 0.409423828125, 0.519012451171875, 0.62860107421875, 0.738189697265625, 0.8477783203125, 0.957366943359375, 1.06695556640625, 1.176544189453125, 1.2861328125, 1.395721435546875, 1.50531005859375, 1.614898681640625, 1.7244873046875, 1.834075927734375, 1.94366455078125, 2.053253173828125, 2.162841796875, 2.272430419921875, 2.38201904296875, 2.491607666015625, 2.6011962890625, 2.710784912109375, 2.82037353515625, 2.929962158203125, 3.03955078125, 3.149139404296875, 3.25872802734375, 3.368316650390625, 3.4779052734375, 3.587493896484375, 3.69708251953125, 3.806671142578125, 3.916259765625, 4.025848388671875, 4.13543701171875, 4.245025634765625, 4.3546142578125, 4.464202880859375, 4.57379150390625, 4.683380126953125, 4.79296875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 6.0, 4.0, 7.0, 10.0, 26.0, 30.0, 44.0, 61.0, 68.0, 83.0, 87.0, 112.0, 95.0, 93.0, 65.0, 65.0, 44.0, 28.0, 26.0, 16.0, 7.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.663066864013672, -10.300556182861328, -9.9380464553833, -9.575535774230957, -9.21302604675293, -8.850515365600586, -8.488004684448242, -8.125494003295898, -7.762984275817871, -7.4004740715026855, -7.0379638671875, -6.675453186035156, -6.312942981719971, -5.950432777404785, -5.587922096252441, -5.225411891937256, -4.86290168762207, -4.500391483306885, -4.137881278991699, -3.7753705978393555, -3.41286039352417, -3.0503501892089844, -2.6878397464752197, -2.325329303741455, -1.9628190994262695, -1.6003087759017944, -1.2377984523773193, -0.8752881288528442, -0.5127778053283691, -0.15026748180389404, 0.21224284172058105, 0.5747532844543457, 0.9372644424438477, 1.2997747659683228, 1.6622850894927979, 2.0247955322265625, 2.387305736541748, 2.7498159408569336, 3.1123263835906982, 3.474836826324463, 3.8373470306396484, 4.199857234954834, 4.5623674392700195, 4.924878120422363, 5.287388324737549, 5.649898529052734, 6.012409210205078, 6.374919414520264, 6.737429618835449, 7.099939823150635, 7.46245002746582, 7.824960708618164, 8.187471389770508, 8.549981117248535, 8.912491798400879, 9.275001525878906, 9.63751220703125, 10.000022888183594, 10.362532615661621, 10.725043296813965, 11.087553024291992, 11.450063705444336, 11.81257438659668, 12.175085067749023, 12.53759479522705]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 8.0, 6.0, 9.0, 12.0, 18.0, 20.0, 10.0, 15.0, 23.0, 21.0, 32.0, 30.0, 28.0, 37.0, 28.0, 38.0, 39.0, 35.0, 37.0, 30.0, 39.0, 34.0, 40.0, 37.0, 37.0, 33.0, 25.0, 28.0, 43.0, 23.0, 21.0, 18.0, 17.0, 21.0, 18.0, 15.0, 15.0, 7.0, 10.0, 4.0, 4.0, 8.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.964675426483154, -5.77907133102417, -5.593467712402344, -5.407863616943359, -5.222259521484375, -5.036655902862549, -4.8510518074035645, -4.665448188781738, -4.479844093322754, -4.2942399978637695, -4.108636379241943, -3.923032283782959, -3.7374284267425537, -3.5518245697021484, -3.366220474243164, -3.180616617202759, -2.9950127601623535, -2.8094089031219482, -2.623805046081543, -2.4382009506225586, -2.2525970935821533, -2.066993236541748, -1.8813892602920532, -1.6957852840423584, -1.5101814270019531, -1.3245775699615479, -1.138973593711853, -0.953369677066803, -0.7677657604217529, -0.5821618437767029, -0.39655792713165283, -0.210953950881958, -0.025350570678710938, 0.1602533459663391, 0.34585726261138916, 0.5314611792564392, 0.7170650959014893, 0.9026690125465393, 1.0882729291915894, 1.2738769054412842, 1.4594807624816895, 1.6450846195220947, 1.8306885957717896, 2.0162925720214844, 2.2018964290618896, 2.387500286102295, 2.5731043815612793, 2.7587082386016846, 2.94431209564209, 3.129915952682495, 3.3155198097229004, 3.5011239051818848, 3.68672776222229, 3.8723316192626953, 4.05793571472168, 4.243539810180664, 4.42914342880249, 4.614747524261475, 4.800351142883301, 4.985955238342285, 5.1715593338012695, 5.357162952423096, 5.54276704788208, 5.728370666503906, 5.913974761962891]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 12.0, 9.0, 7.0, 23.0, 35.0, 59.0, 96.0, 197.0, 335.0, 817.0, 2111.0, 5543.0, 15111.0, 41187.0, 137858.0, 591340.0, 177285.0, 48311.0, 17582.0, 6372.0, 2414.0, 975.0, 409.0, 214.0, 110.0, 57.0, 31.0, 17.0, 15.0, 12.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.5050048828125, -4.357666015625, -4.2103271484375, -4.06298828125, -3.9156494140625, -3.768310546875, -3.6209716796875, -3.4736328125, -3.3262939453125, -3.178955078125, -3.0316162109375, -2.88427734375, -2.7369384765625, -2.589599609375, -2.4422607421875, -2.294921875, -2.1475830078125, -2.000244140625, -1.8529052734375, -1.70556640625, -1.5582275390625, -1.410888671875, -1.2635498046875, -1.1162109375, -0.9688720703125, -0.821533203125, -0.6741943359375, -0.52685546875, -0.3795166015625, -0.232177734375, -0.0848388671875, 0.0625, 0.2098388671875, 0.357177734375, 0.5045166015625, 0.65185546875, 0.7991943359375, 0.946533203125, 1.0938720703125, 1.2412109375, 1.3885498046875, 1.535888671875, 1.6832275390625, 1.83056640625, 1.9779052734375, 2.125244140625, 2.2725830078125, 2.419921875, 2.5672607421875, 2.714599609375, 2.8619384765625, 3.00927734375, 3.1566162109375, 3.303955078125, 3.4512939453125, 3.5986328125, 3.7459716796875, 3.893310546875, 4.0406494140625, 4.18798828125, 4.3353271484375, 4.482666015625, 4.6300048828125, 4.77734375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 8.0, 13.0, 5.0, 18.0, 14.0, 15.0, 21.0, 29.0, 35.0, 36.0, 52.0, 42.0, 52.0, 52.0, 41.0, 48.0, 48.0, 57.0, 39.0, 47.0, 37.0, 44.0, 40.0, 34.0, 23.0, 30.0, 26.0, 20.0, 17.0, 6.0, 14.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.0360336303710938, -1.0066375732421875, -0.9772415161132812, -0.947845458984375, -0.9184494018554688, -0.8890533447265625, -0.8596572875976562, -0.83026123046875, -0.8008651733398438, -0.7714691162109375, -0.7420730590820312, -0.712677001953125, -0.6832809448242188, -0.6538848876953125, -0.6244888305664062, -0.5950927734375, -0.5656967163085938, -0.5363006591796875, -0.5069046020507812, -0.477508544921875, -0.44811248779296875, -0.4187164306640625, -0.38932037353515625, -0.35992431640625, -0.33052825927734375, -0.3011322021484375, -0.27173614501953125, -0.242340087890625, -0.21294403076171875, -0.1835479736328125, -0.15415191650390625, -0.124755859375, -0.09535980224609375, -0.0659637451171875, -0.03656768798828125, -0.007171630859375, 0.02222442626953125, 0.0516204833984375, 0.08101654052734375, 0.11041259765625, 0.13980865478515625, 0.1692047119140625, 0.19860076904296875, 0.227996826171875, 0.25739288330078125, 0.2867889404296875, 0.31618499755859375, 0.3455810546875, 0.37497711181640625, 0.4043731689453125, 0.43376922607421875, 0.463165283203125, 0.49256134033203125, 0.5219573974609375, 0.5513534545898438, 0.58074951171875, 0.6101455688476562, 0.6395416259765625, 0.6689376831054688, 0.698333740234375, 0.7277297973632812, 0.7571258544921875, 0.7865219116210938, 0.81591796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 13.0, 15.0, 25.0, 29.0, 39.0, 55.0, 69.0, 147.0, 219.0, 389.0, 742.0, 1515.0, 3663.0, 9075.0, 23941.0, 71331.0, 456623.0, 379612.0, 64040.0, 22204.0, 8411.0, 3377.0, 1427.0, 673.0, 321.0, 207.0, 113.0, 85.0, 60.0, 33.0, 21.0, 22.0, 14.0, 11.0, 7.0, 5.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.84375, -4.69677734375, -4.5498046875, -4.40283203125, -4.255859375, -4.10888671875, -3.9619140625, -3.81494140625, -3.66796875, -3.52099609375, -3.3740234375, -3.22705078125, -3.080078125, -2.93310546875, -2.7861328125, -2.63916015625, -2.4921875, -2.34521484375, -2.1982421875, -2.05126953125, -1.904296875, -1.75732421875, -1.6103515625, -1.46337890625, -1.31640625, -1.16943359375, -1.0224609375, -0.87548828125, -0.728515625, -0.58154296875, -0.4345703125, -0.28759765625, -0.140625, 0.00634765625, 0.1533203125, 0.30029296875, 0.447265625, 0.59423828125, 0.7412109375, 0.88818359375, 1.03515625, 1.18212890625, 1.3291015625, 1.47607421875, 1.623046875, 1.77001953125, 1.9169921875, 2.06396484375, 2.2109375, 2.35791015625, 2.5048828125, 2.65185546875, 2.798828125, 2.94580078125, 3.0927734375, 3.23974609375, 3.38671875, 3.53369140625, 3.6806640625, 3.82763671875, 3.974609375, 4.12158203125, 4.2685546875, 4.41552734375, 4.5625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 7.0, 10.0, 13.0, 30.0, 24.0, 33.0, 34.0, 35.0, 40.0, 32.0, 45.0, 46.0, 47.0, 58.0, 56.0, 48.0, 53.0, 47.0, 48.0, 46.0, 26.0, 30.0, 25.0, 33.0, 19.0, 26.0, 9.0, 12.0, 9.0, 5.0, 8.0, 6.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.5703125, -4.427001953125, -4.28369140625, -4.140380859375, -3.9970703125, -3.853759765625, -3.71044921875, -3.567138671875, -3.423828125, -3.280517578125, -3.13720703125, -2.993896484375, -2.8505859375, -2.707275390625, -2.56396484375, -2.420654296875, -2.27734375, -2.134033203125, -1.99072265625, -1.847412109375, -1.7041015625, -1.560791015625, -1.41748046875, -1.274169921875, -1.130859375, -0.987548828125, -0.84423828125, -0.700927734375, -0.5576171875, -0.414306640625, -0.27099609375, -0.127685546875, 0.015625, 0.158935546875, 0.30224609375, 0.445556640625, 0.5888671875, 0.732177734375, 0.87548828125, 1.018798828125, 1.162109375, 1.305419921875, 1.44873046875, 1.592041015625, 1.7353515625, 1.878662109375, 2.02197265625, 2.165283203125, 2.30859375, 2.451904296875, 2.59521484375, 2.738525390625, 2.8818359375, 3.025146484375, 3.16845703125, 3.311767578125, 3.455078125, 3.598388671875, 3.74169921875, 3.885009765625, 4.0283203125, 4.171630859375, 4.31494140625, 4.458251953125, 4.6015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 13.0, 13.0, 14.0, 35.0, 72.0, 95.0, 146.0, 282.0, 559.0, 1042.0, 2190.0, 5005.0, 13183.0, 40111.0, 203134.0, 666842.0, 78130.0, 23007.0, 8170.0, 3260.0, 1537.0, 774.0, 409.0, 220.0, 124.0, 75.0, 40.0, 28.0, 16.0, 8.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.278961181640625, -2.18096923828125, -2.082977294921875, -1.9849853515625, -1.886993408203125, -1.78900146484375, -1.691009521484375, -1.593017578125, -1.495025634765625, -1.39703369140625, -1.299041748046875, -1.2010498046875, -1.103057861328125, -1.00506591796875, -0.907073974609375, -0.80908203125, -0.711090087890625, -0.61309814453125, -0.515106201171875, -0.4171142578125, -0.319122314453125, -0.22113037109375, -0.123138427734375, -0.025146484375, 0.072845458984375, 0.17083740234375, 0.268829345703125, 0.3668212890625, 0.464813232421875, 0.56280517578125, 0.660797119140625, 0.7587890625, 0.856781005859375, 0.95477294921875, 1.052764892578125, 1.1507568359375, 1.248748779296875, 1.34674072265625, 1.444732666015625, 1.542724609375, 1.640716552734375, 1.73870849609375, 1.836700439453125, 1.9346923828125, 2.032684326171875, 2.13067626953125, 2.228668212890625, 2.32666015625, 2.424652099609375, 2.52264404296875, 2.620635986328125, 2.7186279296875, 2.816619873046875, 2.91461181640625, 3.012603759765625, 3.110595703125, 3.208587646484375, 3.30657958984375, 3.404571533203125, 3.5025634765625, 3.600555419921875, 3.69854736328125, 3.796539306640625, 3.89453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 11.0, 10.0, 8.0, 18.0, 17.0, 27.0, 46.0, 228.0, 423.0, 97.0, 27.0, 23.0, 12.0, 13.0, 12.0, 10.0, 5.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013780593872070312, -0.0013377964496612549, -0.0012975335121154785, -0.0012572705745697021, -0.0012170076370239258, -0.0011767446994781494, -0.001136481761932373, -0.0010962188243865967, -0.0010559558868408203, -0.001015692949295044, -0.0009754300117492676, -0.0009351670742034912, -0.0008949041366577148, -0.0008546411991119385, -0.0008143782615661621, -0.0007741153240203857, -0.0007338523864746094, -0.000693589448928833, -0.0006533265113830566, -0.0006130635738372803, -0.0005728006362915039, -0.0005325376987457275, -0.0004922747611999512, -0.0004520118236541748, -0.00041174888610839844, -0.00037148594856262207, -0.0003312230110168457, -0.00029096007347106934, -0.00025069713592529297, -0.0002104341983795166, -0.00017017126083374023, -0.00012990832328796387, -8.96453857421875e-05, -4.938244819641113e-05, -9.119510650634766e-06, 3.11434268951416e-05, 7.140636444091797e-05, 0.00011166930198669434, 0.0001519322395324707, 0.00019219517707824707, 0.00023245811462402344, 0.0002727210521697998, 0.00031298398971557617, 0.00035324692726135254, 0.0003935098648071289, 0.0004337728023529053, 0.00047403573989868164, 0.000514298677444458, 0.0005545616149902344, 0.0005948245525360107, 0.0006350874900817871, 0.0006753504276275635, 0.0007156133651733398, 0.0007558763027191162, 0.0007961392402648926, 0.0008364021778106689, 0.0008766651153564453, 0.0009169280529022217, 0.000957190990447998, 0.0009974539279937744, 0.0010377168655395508, 0.0010779798030853271, 0.0011182427406311035, 0.0011585056781768799, 0.0011987686157226562]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 11.0, 16.0, 23.0, 35.0, 61.0, 77.0, 121.0, 220.0, 311.0, 627.0, 1242.0, 2860.0, 7538.0, 22208.0, 76194.0, 580423.0, 281600.0, 49490.0, 15595.0, 5488.0, 2225.0, 996.0, 469.0, 247.0, 159.0, 100.0, 80.0, 40.0, 32.0, 19.0, 12.0, 7.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.705078125, -2.614410400390625, -2.52374267578125, -2.433074951171875, -2.3424072265625, -2.251739501953125, -2.16107177734375, -2.070404052734375, -1.979736328125, -1.889068603515625, -1.79840087890625, -1.707733154296875, -1.6170654296875, -1.526397705078125, -1.43572998046875, -1.345062255859375, -1.25439453125, -1.163726806640625, -1.07305908203125, -0.982391357421875, -0.8917236328125, -0.801055908203125, -0.71038818359375, -0.619720458984375, -0.529052734375, -0.438385009765625, -0.34771728515625, -0.257049560546875, -0.1663818359375, -0.075714111328125, 0.01495361328125, 0.105621337890625, 0.1962890625, 0.286956787109375, 0.37762451171875, 0.468292236328125, 0.5589599609375, 0.649627685546875, 0.74029541015625, 0.830963134765625, 0.921630859375, 1.012298583984375, 1.10296630859375, 1.193634033203125, 1.2843017578125, 1.374969482421875, 1.46563720703125, 1.556304931640625, 1.64697265625, 1.737640380859375, 1.82830810546875, 1.918975830078125, 2.0096435546875, 2.100311279296875, 2.19097900390625, 2.281646728515625, 2.372314453125, 2.462982177734375, 2.55364990234375, 2.644317626953125, 2.7349853515625, 2.825653076171875, 2.91632080078125, 3.006988525390625, 3.09765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 4.0, 7.0, 12.0, 17.0, 20.0, 17.0, 32.0, 33.0, 55.0, 84.0, 125.0, 138.0, 128.0, 78.0, 63.0, 35.0, 30.0, 22.0, 12.0, 9.0, 13.0, 14.0, 8.0, 8.0, 8.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.232421875, -2.15399169921875, -2.0755615234375, -1.99713134765625, -1.918701171875, -1.84027099609375, -1.7618408203125, -1.68341064453125, -1.60498046875, -1.52655029296875, -1.4481201171875, -1.36968994140625, -1.291259765625, -1.21282958984375, -1.1343994140625, -1.05596923828125, -0.9775390625, -0.89910888671875, -0.8206787109375, -0.74224853515625, -0.663818359375, -0.58538818359375, -0.5069580078125, -0.42852783203125, -0.35009765625, -0.27166748046875, -0.1932373046875, -0.11480712890625, -0.036376953125, 0.04205322265625, 0.1204833984375, 0.19891357421875, 0.27734375, 0.35577392578125, 0.4342041015625, 0.51263427734375, 0.591064453125, 0.66949462890625, 0.7479248046875, 0.82635498046875, 0.90478515625, 0.98321533203125, 1.0616455078125, 1.14007568359375, 1.218505859375, 1.29693603515625, 1.3753662109375, 1.45379638671875, 1.5322265625, 1.61065673828125, 1.6890869140625, 1.76751708984375, 1.845947265625, 1.92437744140625, 2.0028076171875, 2.08123779296875, 2.15966796875, 2.23809814453125, 2.3165283203125, 2.39495849609375, 2.473388671875, 2.55181884765625, 2.6302490234375, 2.70867919921875, 2.787109375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 17.0, 28.0, 36.0, 68.0, 110.0, 128.0, 146.0, 125.0, 120.0, 84.0, 53.0, 46.0, 12.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.865299224853516, -33.67063903808594, -32.475975036621094, -31.281312942504883, -30.086650848388672, -28.891990661621094, -27.697328567504883, -26.502666473388672, -25.30800437927246, -24.11334228515625, -22.91868019104004, -21.724018096923828, -20.52935791015625, -19.334693908691406, -18.140033721923828, -16.945371627807617, -15.750709533691406, -14.556047439575195, -13.361385345458984, -12.16672420501709, -10.972062110900879, -9.777400016784668, -8.582738876342773, -7.3880767822265625, -6.193414688110352, -4.998752593994141, -3.804090976715088, -2.609429121017456, -1.4147672653198242, -0.22010517120361328, 0.9745564460754395, 2.169218063354492, 3.363880157470703, 4.558542251586914, 5.753203868865967, 6.9478654861450195, 8.14252758026123, 9.337189674377441, 10.531850814819336, 11.726512908935547, 12.921175003051758, 14.115837097167969, 15.31049919128418, 16.50516128540039, 17.69982147216797, 18.894485473632812, 20.08914566040039, 21.2838077545166, 22.478469848632812, 23.673131942749023, 24.867794036865234, 26.062456130981445, 27.257118225097656, 28.451778411865234, 29.646440505981445, 30.841102600097656, 32.0357666015625, 33.23042678833008, 34.42509078979492, 35.6197509765625, 36.814414978027344, 38.00907516479492, 39.203739166259766, 40.398399353027344, 41.59305953979492]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 3.0, 5.0, 8.0, 12.0, 11.0, 12.0, 24.0, 19.0, 29.0, 22.0, 30.0, 38.0, 23.0, 41.0, 30.0, 43.0, 42.0, 36.0, 45.0, 42.0, 44.0, 38.0, 36.0, 41.0, 47.0, 35.0, 36.0, 30.0, 24.0, 26.0, 18.0, 26.0, 19.0, 11.0, 9.0, 15.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.276134490966797, -18.637989044189453, -17.99984359741211, -17.361696243286133, -16.72355079650879, -16.085405349731445, -15.447259902954102, -14.809114456176758, -14.170968055725098, -13.532822608947754, -12.894676208496094, -12.25653076171875, -11.618385314941406, -10.980238914489746, -10.342093467712402, -9.703947067260742, -9.065801620483398, -8.427656173706055, -7.7895097732543945, -7.151364326477051, -6.513218402862549, -5.875072479248047, -5.236927032470703, -4.598781108856201, -3.960635185241699, -3.3224892616271973, -2.6843435764312744, -2.0461978912353516, -1.4080519676208496, -0.7699060440063477, -0.1317603588104248, 0.506385326385498, 1.14453125, 1.7826770544052124, 2.420822858810425, 3.0589685440063477, 3.6971144676208496, 4.335260391235352, 4.973405838012695, 5.611551761627197, 6.249697685241699, 6.887843608856201, 7.525989532470703, 8.164134979248047, 8.80228042602539, 9.44042682647705, 10.078572273254395, 10.716718673706055, 11.354864120483398, 11.993009567260742, 12.631155967712402, 13.269301414489746, 13.907447814941406, 14.54559326171875, 15.183738708496094, 15.821884155273438, 16.46002960205078, 17.098175048828125, 17.73632049560547, 18.374467849731445, 19.01261329650879, 19.650758743286133, 20.288904190063477, 20.92704963684082, 21.565196990966797]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 9.0, 12.0, 16.0, 13.0, 26.0, 37.0, 62.0, 78.0, 133.0, 154.0, 262.0, 395.0, 612.0, 1136.0, 1717.0, 3116.0, 5503.0, 10498.0, 21215.0, 47279.0, 129390.0, 805118.0, 2864481.0, 187369.0, 60960.0, 26582.0, 12938.0, 6570.0, 3555.0, 2036.0, 1221.0, 717.0, 413.0, 240.0, 149.0, 95.0, 61.0, 47.0, 31.0, 13.0, 10.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.44781494140625, -4.3135986328125, -4.17938232421875, -4.045166015625, -3.91094970703125, -3.7767333984375, -3.64251708984375, -3.50830078125, -3.37408447265625, -3.2398681640625, -3.10565185546875, -2.971435546875, -2.83721923828125, -2.7030029296875, -2.56878662109375, -2.4345703125, -2.30035400390625, -2.1661376953125, -2.03192138671875, -1.897705078125, -1.76348876953125, -1.6292724609375, -1.49505615234375, -1.36083984375, -1.22662353515625, -1.0924072265625, -0.95819091796875, -0.823974609375, -0.68975830078125, -0.5555419921875, -0.42132568359375, -0.287109375, -0.15289306640625, -0.0186767578125, 0.11553955078125, 0.249755859375, 0.38397216796875, 0.5181884765625, 0.65240478515625, 0.78662109375, 0.92083740234375, 1.0550537109375, 1.18927001953125, 1.323486328125, 1.45770263671875, 1.5919189453125, 1.72613525390625, 1.8603515625, 1.99456787109375, 2.1287841796875, 2.26300048828125, 2.397216796875, 2.53143310546875, 2.6656494140625, 2.79986572265625, 2.93408203125, 3.06829833984375, 3.2025146484375, 3.33673095703125, 3.470947265625, 3.60516357421875, 3.7393798828125, 3.87359619140625, 4.0078125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 5.0, 10.0, 14.0, 20.0, 15.0, 26.0, 34.0, 33.0, 45.0, 62.0, 53.0, 59.0, 59.0, 52.0, 53.0, 57.0, 54.0, 56.0, 43.0, 45.0, 33.0, 41.0, 19.0, 15.0, 22.0, 18.0, 14.0, 7.0, 6.0, 9.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4931640625, -1.455902099609375, -1.41864013671875, -1.381378173828125, -1.3441162109375, -1.306854248046875, -1.26959228515625, -1.232330322265625, -1.195068359375, -1.157806396484375, -1.12054443359375, -1.083282470703125, -1.0460205078125, -1.008758544921875, -0.97149658203125, -0.934234619140625, -0.89697265625, -0.859710693359375, -0.82244873046875, -0.785186767578125, -0.7479248046875, -0.710662841796875, -0.67340087890625, -0.636138916015625, -0.598876953125, -0.561614990234375, -0.52435302734375, -0.487091064453125, -0.4498291015625, -0.412567138671875, -0.37530517578125, -0.338043212890625, -0.30078125, -0.263519287109375, -0.22625732421875, -0.188995361328125, -0.1517333984375, -0.114471435546875, -0.07720947265625, -0.039947509765625, -0.002685546875, 0.034576416015625, 0.07183837890625, 0.109100341796875, 0.1463623046875, 0.183624267578125, 0.22088623046875, 0.258148193359375, 0.29541015625, 0.332672119140625, 0.36993408203125, 0.407196044921875, 0.4444580078125, 0.481719970703125, 0.51898193359375, 0.556243896484375, 0.593505859375, 0.630767822265625, 0.66802978515625, 0.705291748046875, 0.7425537109375, 0.779815673828125, 0.81707763671875, 0.854339599609375, 0.8916015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 10.0, 13.0, 18.0, 27.0, 36.0, 58.0, 94.0, 125.0, 174.0, 275.0, 381.0, 619.0, 975.0, 1652.0, 2797.0, 4884.0, 9356.0, 18591.0, 38668.0, 92221.0, 286777.0, 2726771.0, 734942.0, 157569.0, 60458.0, 27029.0, 13311.0, 6971.0, 3702.0, 2122.0, 1285.0, 811.0, 519.0, 343.0, 206.0, 140.0, 113.0, 60.0, 42.0, 34.0, 30.0, 23.0, 17.0, 12.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-4.4140625, -4.287078857421875, -4.16009521484375, -4.033111572265625, -3.9061279296875, -3.779144287109375, -3.65216064453125, -3.525177001953125, -3.398193359375, -3.271209716796875, -3.14422607421875, -3.017242431640625, -2.8902587890625, -2.763275146484375, -2.63629150390625, -2.509307861328125, -2.38232421875, -2.255340576171875, -2.12835693359375, -2.001373291015625, -1.8743896484375, -1.747406005859375, -1.62042236328125, -1.493438720703125, -1.366455078125, -1.239471435546875, -1.11248779296875, -0.985504150390625, -0.8585205078125, -0.731536865234375, -0.60455322265625, -0.477569580078125, -0.3505859375, -0.223602294921875, -0.09661865234375, 0.030364990234375, 0.1573486328125, 0.284332275390625, 0.41131591796875, 0.538299560546875, 0.665283203125, 0.792266845703125, 0.91925048828125, 1.046234130859375, 1.1732177734375, 1.300201416015625, 1.42718505859375, 1.554168701171875, 1.68115234375, 1.808135986328125, 1.93511962890625, 2.062103271484375, 2.1890869140625, 2.316070556640625, 2.44305419921875, 2.570037841796875, 2.697021484375, 2.824005126953125, 2.95098876953125, 3.077972412109375, 3.2049560546875, 3.331939697265625, 3.45892333984375, 3.585906982421875, 3.712890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 11.0, 12.0, 8.0, 17.0, 22.0, 33.0, 39.0, 54.0, 68.0, 129.0, 156.0, 309.0, 1191.0, 1060.0, 367.0, 194.0, 103.0, 79.0, 54.0, 43.0, 26.0, 21.0, 20.0, 11.0, 8.0, 10.0, 5.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0], "bins": [-2.900390625, -2.824005126953125, -2.74761962890625, -2.671234130859375, -2.5948486328125, -2.518463134765625, -2.44207763671875, -2.365692138671875, -2.289306640625, -2.212921142578125, -2.13653564453125, -2.060150146484375, -1.9837646484375, -1.907379150390625, -1.83099365234375, -1.754608154296875, -1.67822265625, -1.601837158203125, -1.52545166015625, -1.449066162109375, -1.3726806640625, -1.296295166015625, -1.21990966796875, -1.143524169921875, -1.067138671875, -0.990753173828125, -0.91436767578125, -0.837982177734375, -0.7615966796875, -0.685211181640625, -0.60882568359375, -0.532440185546875, -0.4560546875, -0.379669189453125, -0.30328369140625, -0.226898193359375, -0.1505126953125, -0.074127197265625, 0.00225830078125, 0.078643798828125, 0.155029296875, 0.231414794921875, 0.30780029296875, 0.384185791015625, 0.4605712890625, 0.536956787109375, 0.61334228515625, 0.689727783203125, 0.76611328125, 0.842498779296875, 0.91888427734375, 0.995269775390625, 1.0716552734375, 1.148040771484375, 1.22442626953125, 1.300811767578125, 1.377197265625, 1.453582763671875, 1.52996826171875, 1.606353759765625, 1.6827392578125, 1.759124755859375, 1.83551025390625, 1.911895751953125, 1.98828125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 17.0, 49.0, 135.0, 212.0, 245.0, 170.0, 91.0, 41.0, 17.0, 9.0, 1.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.15032196044922, -32.11724853515625, -31.08417510986328, -30.05109977722168, -29.01802635192871, -27.984952926635742, -26.95187759399414, -25.918804168701172, -24.885730743408203, -23.852657318115234, -22.819583892822266, -21.786508560180664, -20.753435134887695, -19.720361709594727, -18.687286376953125, -17.654212951660156, -16.621139526367188, -15.588066101074219, -14.554991722106934, -13.521917343139648, -12.48884391784668, -11.455770492553711, -10.422696113586426, -9.38962173461914, -8.356548309326172, -7.323474407196045, -6.290400505065918, -5.257326602935791, -4.224252700805664, -3.191178798675537, -2.15810489654541, -1.1250309944152832, -0.09195709228515625, 0.9411168098449707, 1.9741907119750977, 3.0072646141052246, 4.040338516235352, 5.0734124183654785, 6.1064863204956055, 7.139560222625732, 8.17263412475586, 9.205707550048828, 10.238781929016113, 11.271856307983398, 12.304929733276367, 13.338003158569336, 14.371077537536621, 15.404151916503906, 16.437225341796875, 17.470298767089844, 18.503372192382812, 19.536447525024414, 20.569520950317383, 21.60259437561035, 22.635669708251953, 23.668743133544922, 24.70181655883789, 25.73488998413086, 26.767963409423828, 27.80103874206543, 28.8341121673584, 29.867185592651367, 30.90026092529297, 31.933334350585938, 32.966407775878906]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 16.0, 12.0, 16.0, 14.0, 24.0, 20.0, 27.0, 31.0, 32.0, 32.0, 51.0, 41.0, 44.0, 45.0, 53.0, 47.0, 41.0, 49.0, 42.0, 45.0, 37.0, 21.0, 39.0, 30.0, 24.0, 25.0, 23.0, 16.0, 16.0, 15.0, 14.0, 5.0, 7.0, 8.0, 11.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.166526794433594, -9.8659086227417, -9.565290451049805, -9.264673233032227, -8.964055061340332, -8.663436889648438, -8.362818717956543, -8.062200546264648, -7.761582374572754, -7.460964202880859, -7.160346508026123, -6.8597283363342285, -6.559110164642334, -6.258492469787598, -5.957874298095703, -5.657256126403809, -5.356638431549072, -5.056020259857178, -4.755402565002441, -4.454784393310547, -4.154166221618652, -3.853548288345337, -3.5529303550720215, -3.252312183380127, -2.9516942501068115, -2.651076316833496, -2.3504581451416016, -2.049840211868286, -1.7492221593856812, -1.4486041069030762, -1.1479861736297607, -0.8473680019378662, -0.5467500686645508, -0.2461320459842682, 0.054485976696014404, 0.3551039695739746, 0.6557220220565796, 0.9563400745391846, 1.2569580078125, 1.5575761795043945, 1.85819411277771, 2.1588120460510254, 2.45943021774292, 2.7600481510162354, 3.060666084289551, 3.3612842559814453, 3.6619021892547607, 3.9625203609466553, 4.263138294219971, 4.563756465911865, 4.864374160766602, 5.164992332458496, 5.465610504150391, 5.766228675842285, 6.0668463706970215, 6.367464542388916, 6.668082237243652, 6.968700408935547, 7.269318103790283, 7.569936275482178, 7.870554447174072, 8.171172142028809, 8.471790313720703, 8.772408485412598, 9.073026657104492]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 4.0, 5.0, 14.0, 12.0, 17.0, 14.0, 30.0, 37.0, 54.0, 87.0, 113.0, 189.0, 271.0, 466.0, 875.0, 1596.0, 3228.0, 6144.0, 12347.0, 25160.0, 47547.0, 89519.0, 190154.0, 335395.0, 166192.0, 80656.0, 43263.0, 22257.0, 11009.0, 5547.0, 2831.0, 1528.0, 727.0, 442.0, 276.0, 162.0, 122.0, 75.0, 58.0, 41.0, 24.0, 17.0, 16.0, 8.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.826171875, -2.719207763671875, -2.61224365234375, -2.505279541015625, -2.3983154296875, -2.291351318359375, -2.18438720703125, -2.077423095703125, -1.970458984375, -1.863494873046875, -1.75653076171875, -1.649566650390625, -1.5426025390625, -1.435638427734375, -1.32867431640625, -1.221710205078125, -1.11474609375, -1.007781982421875, -0.90081787109375, -0.793853759765625, -0.6868896484375, -0.579925537109375, -0.47296142578125, -0.365997314453125, -0.259033203125, -0.152069091796875, -0.04510498046875, 0.061859130859375, 0.1688232421875, 0.275787353515625, 0.38275146484375, 0.489715576171875, 0.5966796875, 0.703643798828125, 0.81060791015625, 0.917572021484375, 1.0245361328125, 1.131500244140625, 1.23846435546875, 1.345428466796875, 1.452392578125, 1.559356689453125, 1.66632080078125, 1.773284912109375, 1.8802490234375, 1.987213134765625, 2.09417724609375, 2.201141357421875, 2.30810546875, 2.415069580078125, 2.52203369140625, 2.628997802734375, 2.7359619140625, 2.842926025390625, 2.94989013671875, 3.056854248046875, 3.163818359375, 3.270782470703125, 3.37774658203125, 3.484710693359375, 3.5916748046875, 3.698638916015625, 3.80560302734375, 3.912567138671875, 4.01953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 6.0, 9.0, 6.0, 8.0, 13.0, 17.0, 12.0, 19.0, 18.0, 17.0, 21.0, 39.0, 34.0, 49.0, 34.0, 42.0, 32.0, 40.0, 51.0, 45.0, 53.0, 38.0, 39.0, 38.0, 29.0, 43.0, 19.0, 31.0, 17.0, 23.0, 19.0, 18.0, 23.0, 19.0, 15.0, 10.0, 12.0, 5.0, 4.0, 10.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.001953125, -0.97119140625, -0.9404296875, -0.90966796875, -0.87890625, -0.84814453125, -0.8173828125, -0.78662109375, -0.755859375, -0.72509765625, -0.6943359375, -0.66357421875, -0.6328125, -0.60205078125, -0.5712890625, -0.54052734375, -0.509765625, -0.47900390625, -0.4482421875, -0.41748046875, -0.38671875, -0.35595703125, -0.3251953125, -0.29443359375, -0.263671875, -0.23291015625, -0.2021484375, -0.17138671875, -0.140625, -0.10986328125, -0.0791015625, -0.04833984375, -0.017578125, 0.01318359375, 0.0439453125, 0.07470703125, 0.10546875, 0.13623046875, 0.1669921875, 0.19775390625, 0.228515625, 0.25927734375, 0.2900390625, 0.32080078125, 0.3515625, 0.38232421875, 0.4130859375, 0.44384765625, 0.474609375, 0.50537109375, 0.5361328125, 0.56689453125, 0.59765625, 0.62841796875, 0.6591796875, 0.68994140625, 0.720703125, 0.75146484375, 0.7822265625, 0.81298828125, 0.84375, 0.87451171875, 0.9052734375, 0.93603515625, 0.966796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 2.0, 9.0, 5.0, 20.0, 19.0, 19.0, 29.0, 50.0, 72.0, 91.0, 116.0, 165.0, 231.0, 402.0, 681.0, 1282.0, 3500.0, 18155.0, 136451.0, 724645.0, 137353.0, 18389.0, 3653.0, 1311.0, 648.0, 422.0, 247.0, 194.0, 122.0, 84.0, 48.0, 38.0, 36.0, 17.0, 11.0, 7.0, 8.0, 7.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.2032470703125, -9.898681640625, -9.5941162109375, -9.28955078125, -8.9849853515625, -8.680419921875, -8.3758544921875, -8.0712890625, -7.7667236328125, -7.462158203125, -7.1575927734375, -6.85302734375, -6.5484619140625, -6.243896484375, -5.9393310546875, -5.634765625, -5.3302001953125, -5.025634765625, -4.7210693359375, -4.41650390625, -4.1119384765625, -3.807373046875, -3.5028076171875, -3.1982421875, -2.8936767578125, -2.589111328125, -2.2845458984375, -1.97998046875, -1.6754150390625, -1.370849609375, -1.0662841796875, -0.76171875, -0.4571533203125, -0.152587890625, 0.1519775390625, 0.45654296875, 0.7611083984375, 1.065673828125, 1.3702392578125, 1.6748046875, 1.9793701171875, 2.283935546875, 2.5885009765625, 2.89306640625, 3.1976318359375, 3.502197265625, 3.8067626953125, 4.111328125, 4.4158935546875, 4.720458984375, 5.0250244140625, 5.32958984375, 5.6341552734375, 5.938720703125, 6.2432861328125, 6.5478515625, 6.8524169921875, 7.156982421875, 7.4615478515625, 7.76611328125, 8.0706787109375, 8.375244140625, 8.6798095703125, 8.984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 8.0, 5.0, 12.0, 8.0, 19.0, 16.0, 18.0, 26.0, 36.0, 27.0, 35.0, 40.0, 46.0, 40.0, 59.0, 53.0, 45.0, 47.0, 54.0, 49.0, 44.0, 44.0, 40.0, 36.0, 32.0, 32.0, 23.0, 23.0, 16.0, 15.0, 13.0, 10.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.51953125, -5.3348388671875, -5.150146484375, -4.9654541015625, -4.78076171875, -4.5960693359375, -4.411376953125, -4.2266845703125, -4.0419921875, -3.8572998046875, -3.672607421875, -3.4879150390625, -3.30322265625, -3.1185302734375, -2.933837890625, -2.7491455078125, -2.564453125, -2.3797607421875, -2.195068359375, -2.0103759765625, -1.82568359375, -1.6409912109375, -1.456298828125, -1.2716064453125, -1.0869140625, -0.9022216796875, -0.717529296875, -0.5328369140625, -0.34814453125, -0.1634521484375, 0.021240234375, 0.2059326171875, 0.390625, 0.5753173828125, 0.760009765625, 0.9447021484375, 1.12939453125, 1.3140869140625, 1.498779296875, 1.6834716796875, 1.8681640625, 2.0528564453125, 2.237548828125, 2.4222412109375, 2.60693359375, 2.7916259765625, 2.976318359375, 3.1610107421875, 3.345703125, 3.5303955078125, 3.715087890625, 3.8997802734375, 4.08447265625, 4.2691650390625, 4.453857421875, 4.6385498046875, 4.8232421875, 5.0079345703125, 5.192626953125, 5.3773193359375, 5.56201171875, 5.7467041015625, 5.931396484375, 6.1160888671875, 6.30078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 13.0, 18.0, 24.0, 27.0, 48.0, 66.0, 77.0, 115.0, 161.0, 204.0, 337.0, 533.0, 800.0, 1337.0, 2379.0, 4969.0, 12947.0, 41801.0, 169080.0, 609593.0, 145232.0, 36855.0, 11564.0, 4529.0, 2272.0, 1260.0, 762.0, 471.0, 290.0, 247.0, 143.0, 109.0, 65.0, 65.0, 34.0, 27.0, 28.0, 16.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.630645751953125, -3.51519775390625, -3.399749755859375, -3.2843017578125, -3.168853759765625, -3.05340576171875, -2.937957763671875, -2.822509765625, -2.707061767578125, -2.59161376953125, -2.476165771484375, -2.3607177734375, -2.245269775390625, -2.12982177734375, -2.014373779296875, -1.89892578125, -1.783477783203125, -1.66802978515625, -1.552581787109375, -1.4371337890625, -1.321685791015625, -1.20623779296875, -1.090789794921875, -0.975341796875, -0.859893798828125, -0.74444580078125, -0.628997802734375, -0.5135498046875, -0.398101806640625, -0.28265380859375, -0.167205810546875, -0.0517578125, 0.063690185546875, 0.17913818359375, 0.294586181640625, 0.4100341796875, 0.525482177734375, 0.64093017578125, 0.756378173828125, 0.871826171875, 0.987274169921875, 1.10272216796875, 1.218170166015625, 1.3336181640625, 1.449066162109375, 1.56451416015625, 1.679962158203125, 1.79541015625, 1.910858154296875, 2.02630615234375, 2.141754150390625, 2.2572021484375, 2.372650146484375, 2.48809814453125, 2.603546142578125, 2.718994140625, 2.834442138671875, 2.94989013671875, 3.065338134765625, 3.1807861328125, 3.296234130859375, 3.41168212890625, 3.527130126953125, 3.642578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 5.0, 10.0, 13.0, 12.0, 19.0, 23.0, 31.0, 29.0, 40.0, 58.0, 107.0, 263.0, 114.0, 59.0, 50.0, 36.0, 35.0, 15.0, 20.0, 13.0, 8.0, 8.0, 9.0, 7.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0011301040649414062, -0.0010991916060447693, -0.0010682791471481323, -0.0010373666882514954, -0.0010064542293548584, -0.0009755417704582214, -0.0009446293115615845, -0.0009137168526649475, -0.0008828043937683105, -0.0008518919348716736, -0.0008209794759750366, -0.0007900670170783997, -0.0007591545581817627, -0.0007282420992851257, -0.0006973296403884888, -0.0006664171814918518, -0.0006355047225952148, -0.0006045922636985779, -0.0005736798048019409, -0.000542767345905304, -0.000511854887008667, -0.00048094242811203003, -0.00045002996921539307, -0.0004191175103187561, -0.00038820505142211914, -0.0003572925925254822, -0.0003263801336288452, -0.00029546767473220825, -0.0002645552158355713, -0.00023364275693893433, -0.00020273029804229736, -0.0001718178391456604, -0.00014090538024902344, -0.00010999292135238647, -7.908046245574951e-05, -4.816800355911255e-05, -1.7255544662475586e-05, 1.3656914234161377e-05, 4.456937313079834e-05, 7.54818320274353e-05, 0.00010639429092407227, 0.00013730674982070923, 0.0001682192087173462, 0.00019913166761398315, 0.00023004412651062012, 0.0002609565854072571, 0.00029186904430389404, 0.000322781503200531, 0.00035369396209716797, 0.00038460642099380493, 0.0004155188798904419, 0.00044643133878707886, 0.0004773437976837158, 0.0005082562565803528, 0.0005391687154769897, 0.0005700811743736267, 0.0006009936332702637, 0.0006319060921669006, 0.0006628185510635376, 0.0006937310099601746, 0.0007246434688568115, 0.0007555559277534485, 0.0007864683866500854, 0.0008173808455467224, 0.0008482933044433594]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 13.0, 10.0, 35.0, 36.0, 42.0, 69.0, 110.0, 201.0, 349.0, 816.0, 1875.0, 5254.0, 27512.0, 532031.0, 447496.0, 24351.0, 4996.0, 1733.0, 757.0, 344.0, 189.0, 104.0, 67.0, 46.0, 35.0, 25.0, 11.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1796875, -7.94580078125, -7.7119140625, -7.47802734375, -7.244140625, -7.01025390625, -6.7763671875, -6.54248046875, -6.30859375, -6.07470703125, -5.8408203125, -5.60693359375, -5.373046875, -5.13916015625, -4.9052734375, -4.67138671875, -4.4375, -4.20361328125, -3.9697265625, -3.73583984375, -3.501953125, -3.26806640625, -3.0341796875, -2.80029296875, -2.56640625, -2.33251953125, -2.0986328125, -1.86474609375, -1.630859375, -1.39697265625, -1.1630859375, -0.92919921875, -0.6953125, -0.46142578125, -0.2275390625, 0.00634765625, 0.240234375, 0.47412109375, 0.7080078125, 0.94189453125, 1.17578125, 1.40966796875, 1.6435546875, 1.87744140625, 2.111328125, 2.34521484375, 2.5791015625, 2.81298828125, 3.046875, 3.28076171875, 3.5146484375, 3.74853515625, 3.982421875, 4.21630859375, 4.4501953125, 4.68408203125, 4.91796875, 5.15185546875, 5.3857421875, 5.61962890625, 5.853515625, 6.08740234375, 6.3212890625, 6.55517578125, 6.7890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 9.0, 11.0, 13.0, 23.0, 20.0, 48.0, 74.0, 108.0, 143.0, 152.0, 146.0, 64.0, 67.0, 37.0, 20.0, 26.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.359375, -6.20123291015625, -6.0430908203125, -5.88494873046875, -5.726806640625, -5.56866455078125, -5.4105224609375, -5.25238037109375, -5.09423828125, -4.93609619140625, -4.7779541015625, -4.61981201171875, -4.461669921875, -4.30352783203125, -4.1453857421875, -3.98724365234375, -3.8291015625, -3.67095947265625, -3.5128173828125, -3.35467529296875, -3.196533203125, -3.03839111328125, -2.8802490234375, -2.72210693359375, -2.56396484375, -2.40582275390625, -2.2476806640625, -2.08953857421875, -1.931396484375, -1.77325439453125, -1.6151123046875, -1.45697021484375, -1.298828125, -1.14068603515625, -0.9825439453125, -0.82440185546875, -0.666259765625, -0.50811767578125, -0.3499755859375, -0.19183349609375, -0.03369140625, 0.12445068359375, 0.2825927734375, 0.44073486328125, 0.598876953125, 0.75701904296875, 0.9151611328125, 1.07330322265625, 1.2314453125, 1.38958740234375, 1.5477294921875, 1.70587158203125, 1.864013671875, 2.02215576171875, 2.1802978515625, 2.33843994140625, 2.49658203125, 2.65472412109375, 2.8128662109375, 2.97100830078125, 3.129150390625, 3.28729248046875, 3.4454345703125, 3.60357666015625, 3.76171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 13.0, 32.0, 41.0, 75.0, 105.0, 122.0, 138.0, 156.0, 128.0, 78.0, 50.0, 27.0, 12.0, 3.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.173377990722656, -51.423099517822266, -49.672821044921875, -47.92253875732422, -46.17226028442383, -44.42198181152344, -42.67169952392578, -40.92142105102539, -39.171142578125, -37.42086410522461, -35.67058563232422, -33.92030334472656, -32.17002487182617, -30.41974639892578, -28.669466018676758, -26.919185638427734, -25.168907165527344, -23.418628692626953, -21.66834831237793, -19.918067932128906, -18.167789459228516, -16.417510986328125, -14.667230606079102, -12.916951179504395, -11.166671752929688, -9.41639232635498, -7.666112899780273, -5.915833473205566, -4.165554046630859, -2.4152746200561523, -0.6649951934814453, 1.0852842330932617, 2.8355636596679688, 4.585843086242676, 6.336122512817383, 8.08640193939209, 9.836681365966797, 11.586960792541504, 13.337240219116211, 15.087519645690918, 16.837799072265625, 18.588077545166016, 20.33835792541504, 22.088638305664062, 23.838916778564453, 25.589195251464844, 27.339475631713867, 29.08975601196289, 30.84003448486328, 32.59031295776367, 34.34059143066406, 36.09087371826172, 37.84115219116211, 39.5914306640625, 41.341712951660156, 43.09199142456055, 44.84226989746094, 46.59254837036133, 48.34282684326172, 50.093109130859375, 51.843387603759766, 53.593666076660156, 55.34394836425781, 57.0942268371582, 58.844505310058594]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 9.0, 8.0, 19.0, 10.0, 12.0, 13.0, 18.0, 30.0, 25.0, 28.0, 37.0, 46.0, 26.0, 31.0, 41.0, 35.0, 62.0, 45.0, 51.0, 41.0, 49.0, 33.0, 39.0, 36.0, 41.0, 33.0, 23.0, 25.0, 23.0, 19.0, 13.0, 16.0, 16.0, 8.0, 6.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.392677307128906, -27.44343376159668, -26.494190216064453, -25.544946670532227, -24.595703125, -23.64645767211914, -22.697216033935547, -21.747970581054688, -20.79872703552246, -19.849483489990234, -18.900239944458008, -17.95099639892578, -17.001752853393555, -16.052509307861328, -15.103264808654785, -14.154020309448242, -13.204777717590332, -12.255534172058105, -11.306290626525879, -10.357046127319336, -9.40780258178711, -8.458559036254883, -7.509315490722656, -6.5600714683532715, -5.610827922821045, -4.661584377288818, -3.7123403549194336, -2.763096809387207, -1.8138530254364014, -0.8646092414855957, 0.08463430404663086, 1.0338783264160156, 1.9831218719482422, 2.932365655899048, 3.8816094398498535, 4.83085298538208, 5.780097007751465, 6.729340553283691, 7.678584098815918, 8.627828598022461, 9.577072143554688, 10.526315689086914, 11.47555923461914, 12.424802780151367, 13.37404727935791, 14.323290824890137, 15.272534370422363, 16.221778869628906, 17.1710205078125, 18.120264053344727, 19.069507598876953, 20.01875114440918, 20.967994689941406, 21.917240142822266, 22.86648178100586, 23.81572723388672, 24.764970779418945, 25.714214324951172, 26.6634578704834, 27.612701416015625, 28.56194496154785, 29.511188507080078, 30.460433959960938, 31.409677505493164, 32.35892105102539]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 7.0, 16.0, 19.0, 16.0, 28.0, 38.0, 57.0, 81.0, 122.0, 172.0, 212.0, 322.0, 478.0, 662.0, 1049.0, 1644.0, 2427.0, 4026.0, 6600.0, 11742.0, 21844.0, 45009.0, 109516.0, 398917.0, 2914325.0, 455472.0, 119053.0, 47546.0, 23037.0, 11947.0, 6903.0, 3980.0, 2548.0, 1518.0, 1011.0, 627.0, 422.0, 306.0, 194.0, 105.0, 84.0, 62.0, 37.0, 26.0, 20.0, 15.0, 8.0, 11.0, 10.0, 5.0, 3.0, 2.0, 2.0], "bins": [-3.916015625, -3.805816650390625, -3.69561767578125, -3.585418701171875, -3.4752197265625, -3.365020751953125, -3.25482177734375, -3.144622802734375, -3.034423828125, -2.924224853515625, -2.81402587890625, -2.703826904296875, -2.5936279296875, -2.483428955078125, -2.37322998046875, -2.263031005859375, -2.15283203125, -2.042633056640625, -1.93243408203125, -1.822235107421875, -1.7120361328125, -1.601837158203125, -1.49163818359375, -1.381439208984375, -1.271240234375, -1.161041259765625, -1.05084228515625, -0.940643310546875, -0.8304443359375, -0.720245361328125, -0.61004638671875, -0.499847412109375, -0.3896484375, -0.279449462890625, -0.16925048828125, -0.059051513671875, 0.0511474609375, 0.161346435546875, 0.27154541015625, 0.381744384765625, 0.491943359375, 0.602142333984375, 0.71234130859375, 0.822540283203125, 0.9327392578125, 1.042938232421875, 1.15313720703125, 1.263336181640625, 1.37353515625, 1.483734130859375, 1.59393310546875, 1.704132080078125, 1.8143310546875, 1.924530029296875, 2.03472900390625, 2.144927978515625, 2.255126953125, 2.365325927734375, 2.47552490234375, 2.585723876953125, 2.6959228515625, 2.806121826171875, 2.91632080078125, 3.026519775390625, 3.13671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 4.0, 7.0, 6.0, 16.0, 17.0, 28.0, 20.0, 22.0, 33.0, 42.0, 51.0, 50.0, 31.0, 55.0, 61.0, 56.0, 58.0, 54.0, 49.0, 46.0, 45.0, 47.0, 48.0, 26.0, 30.0, 18.0, 23.0, 10.0, 16.0, 14.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4033203125, -1.3564300537109375, -1.309539794921875, -1.2626495361328125, -1.21575927734375, -1.1688690185546875, -1.121978759765625, -1.0750885009765625, -1.0281982421875, -0.9813079833984375, -0.934417724609375, -0.8875274658203125, -0.84063720703125, -0.7937469482421875, -0.746856689453125, -0.6999664306640625, -0.653076171875, -0.6061859130859375, -0.559295654296875, -0.5124053955078125, -0.46551513671875, -0.4186248779296875, -0.371734619140625, -0.3248443603515625, -0.2779541015625, -0.2310638427734375, -0.184173583984375, -0.1372833251953125, -0.09039306640625, -0.0435028076171875, 0.003387451171875, 0.0502777099609375, 0.09716796875, 0.1440582275390625, 0.190948486328125, 0.2378387451171875, 0.28472900390625, 0.3316192626953125, 0.378509521484375, 0.4253997802734375, 0.4722900390625, 0.5191802978515625, 0.566070556640625, 0.6129608154296875, 0.65985107421875, 0.7067413330078125, 0.753631591796875, 0.8005218505859375, 0.847412109375, 0.8943023681640625, 0.941192626953125, 0.9880828857421875, 1.03497314453125, 1.0818634033203125, 1.128753662109375, 1.1756439208984375, 1.2225341796875, 1.2694244384765625, 1.316314697265625, 1.3632049560546875, 1.41009521484375, 1.4569854736328125, 1.503875732421875, 1.5507659912109375, 1.59765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 2.0, 6.0, 7.0, 13.0, 13.0, 31.0, 69.0, 122.0, 183.0, 313.0, 683.0, 1705.0, 4624.0, 14723.0, 59980.0, 408362.0, 3361016.0, 276991.0, 46323.0, 12342.0, 3884.0, 1573.0, 632.0, 300.0, 160.0, 86.0, 52.0, 38.0, 22.0, 11.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.890625, -7.6312255859375, -7.371826171875, -7.1124267578125, -6.85302734375, -6.5936279296875, -6.334228515625, -6.0748291015625, -5.8154296875, -5.5560302734375, -5.296630859375, -5.0372314453125, -4.77783203125, -4.5184326171875, -4.259033203125, -3.9996337890625, -3.740234375, -3.4808349609375, -3.221435546875, -2.9620361328125, -2.70263671875, -2.4432373046875, -2.183837890625, -1.9244384765625, -1.6650390625, -1.4056396484375, -1.146240234375, -0.8868408203125, -0.62744140625, -0.3680419921875, -0.108642578125, 0.1507568359375, 0.41015625, 0.6695556640625, 0.928955078125, 1.1883544921875, 1.44775390625, 1.7071533203125, 1.966552734375, 2.2259521484375, 2.4853515625, 2.7447509765625, 3.004150390625, 3.2635498046875, 3.52294921875, 3.7823486328125, 4.041748046875, 4.3011474609375, 4.560546875, 4.8199462890625, 5.079345703125, 5.3387451171875, 5.59814453125, 5.8575439453125, 6.116943359375, 6.3763427734375, 6.6357421875, 6.8951416015625, 7.154541015625, 7.4139404296875, 7.67333984375, 7.9327392578125, 8.192138671875, 8.4515380859375, 8.7109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 4.0, 6.0, 8.0, 17.0, 15.0, 22.0, 28.0, 50.0, 71.0, 112.0, 176.0, 361.0, 1036.0, 1294.0, 387.0, 194.0, 105.0, 61.0, 44.0, 24.0, 20.0, 16.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.798828125, -3.663360595703125, -3.52789306640625, -3.392425537109375, -3.2569580078125, -3.121490478515625, -2.98602294921875, -2.850555419921875, -2.715087890625, -2.579620361328125, -2.44415283203125, -2.308685302734375, -2.1732177734375, -2.037750244140625, -1.90228271484375, -1.766815185546875, -1.63134765625, -1.495880126953125, -1.36041259765625, -1.224945068359375, -1.0894775390625, -0.954010009765625, -0.81854248046875, -0.683074951171875, -0.547607421875, -0.412139892578125, -0.27667236328125, -0.141204833984375, -0.0057373046875, 0.129730224609375, 0.26519775390625, 0.400665283203125, 0.5361328125, 0.671600341796875, 0.80706787109375, 0.942535400390625, 1.0780029296875, 1.213470458984375, 1.34893798828125, 1.484405517578125, 1.619873046875, 1.755340576171875, 1.89080810546875, 2.026275634765625, 2.1617431640625, 2.297210693359375, 2.43267822265625, 2.568145751953125, 2.70361328125, 2.839080810546875, 2.97454833984375, 3.110015869140625, 3.2454833984375, 3.380950927734375, 3.51641845703125, 3.651885986328125, 3.787353515625, 3.922821044921875, 4.05828857421875, 4.193756103515625, 4.3292236328125, 4.464691162109375, 4.60015869140625, 4.735626220703125, 4.87109375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 10.0, 11.0, 8.0, 19.0, 27.0, 26.0, 32.0, 48.0, 80.0, 60.0, 85.0, 71.0, 106.0, 80.0, 80.0, 70.0, 54.0, 39.0, 29.0, 22.0, 10.0, 8.0, 8.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.355403900146484, -17.81327247619629, -17.27113914489746, -16.729007720947266, -16.186874389648438, -15.644742965698242, -15.102611541748047, -14.560479164123535, -14.018346786499023, -13.476214408874512, -12.93408203125, -12.391950607299805, -11.849818229675293, -11.307685852050781, -10.765554428100586, -10.223422050476074, -9.681289672851562, -9.13915729522705, -8.597024917602539, -8.054893493652344, -7.512761116027832, -6.97062873840332, -6.428496837615967, -5.886364936828613, -5.344232559204102, -4.80210018157959, -4.259968280792236, -3.7178361415863037, -3.175704002380371, -2.6335718631744385, -2.091439723968506, -1.5493075847625732, -1.0071754455566406, -0.465043306350708, 0.07708883285522461, 0.6192209720611572, 1.1613531112670898, 1.7034852504730225, 2.245617389678955, 2.7877495288848877, 3.3298816680908203, 3.872013807296753, 4.4141459465026855, 4.956277847290039, 5.498410224914551, 6.0405426025390625, 6.582674503326416, 7.1248064041137695, 7.666938781738281, 8.209071159362793, 8.751203536987305, 9.2933349609375, 9.835467338562012, 10.377599716186523, 10.919731140136719, 11.46186351776123, 12.003995895385742, 12.546128273010254, 13.088260650634766, 13.630392074584961, 14.172524452209473, 14.714656829833984, 15.25678825378418, 15.798920631408691, 16.341053009033203]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 7.0, 8.0, 15.0, 16.0, 18.0, 33.0, 25.0, 15.0, 34.0, 30.0, 38.0, 39.0, 47.0, 41.0, 49.0, 36.0, 40.0, 49.0, 44.0, 40.0, 44.0, 40.0, 31.0, 38.0, 24.0, 32.0, 26.0, 23.0, 16.0, 14.0, 12.0, 9.0, 14.0, 8.0, 6.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-14.465404510498047, -14.067216873168945, -13.669029235839844, -13.270841598510742, -12.87265396118164, -12.474466323852539, -12.076278686523438, -11.678091049194336, -11.279903411865234, -10.881715774536133, -10.483528137207031, -10.08534049987793, -9.687152862548828, -9.288965225219727, -8.890777587890625, -8.492589950561523, -8.094402313232422, -7.69621467590332, -7.298027038574219, -6.899839401245117, -6.501651763916016, -6.103464126586914, -5.7052764892578125, -5.307088851928711, -4.908901214599609, -4.510713577270508, -4.112525939941406, -3.7143383026123047, -3.316150665283203, -2.9179630279541016, -2.519775390625, -2.1215877532958984, -1.7234001159667969, -1.3252124786376953, -0.9270248413085938, -0.5288372039794922, -0.13064956665039062, 0.26753807067871094, 0.6657257080078125, 1.063913345336914, 1.4621009826660156, 1.8602886199951172, 2.2584762573242188, 2.6566638946533203, 3.054851531982422, 3.4530391693115234, 3.851226806640625, 4.249414443969727, 4.647602081298828, 5.04578971862793, 5.443977355957031, 5.842164993286133, 6.240352630615234, 6.638540267944336, 7.0367279052734375, 7.434915542602539, 7.833103179931641, 8.231290817260742, 8.629478454589844, 9.027666091918945, 9.425853729248047, 9.824041366577148, 10.22222900390625, 10.620416641235352, 11.018604278564453]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 9.0, 11.0, 18.0, 23.0, 39.0, 64.0, 79.0, 114.0, 165.0, 246.0, 370.0, 613.0, 981.0, 1630.0, 2631.0, 4797.0, 8226.0, 14987.0, 26579.0, 48148.0, 87003.0, 149399.0, 215231.0, 197831.0, 126692.0, 72116.0, 39897.0, 21891.0, 12193.0, 6684.0, 3951.0, 2290.0, 1323.0, 813.0, 530.0, 281.0, 224.0, 121.0, 104.0, 67.0, 57.0, 30.0, 29.0, 13.0, 17.0, 11.0, 10.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.83984375, -2.750640869140625, -2.66143798828125, -2.572235107421875, -2.4830322265625, -2.393829345703125, -2.30462646484375, -2.215423583984375, -2.126220703125, -2.037017822265625, -1.94781494140625, -1.858612060546875, -1.7694091796875, -1.680206298828125, -1.59100341796875, -1.501800537109375, -1.41259765625, -1.323394775390625, -1.23419189453125, -1.144989013671875, -1.0557861328125, -0.966583251953125, -0.87738037109375, -0.788177490234375, -0.698974609375, -0.609771728515625, -0.52056884765625, -0.431365966796875, -0.3421630859375, -0.252960205078125, -0.16375732421875, -0.074554443359375, 0.0146484375, 0.103851318359375, 0.19305419921875, 0.282257080078125, 0.3714599609375, 0.460662841796875, 0.54986572265625, 0.639068603515625, 0.728271484375, 0.817474365234375, 0.90667724609375, 0.995880126953125, 1.0850830078125, 1.174285888671875, 1.26348876953125, 1.352691650390625, 1.44189453125, 1.531097412109375, 1.62030029296875, 1.709503173828125, 1.7987060546875, 1.887908935546875, 1.97711181640625, 2.066314697265625, 2.155517578125, 2.244720458984375, 2.33392333984375, 2.423126220703125, 2.5123291015625, 2.601531982421875, 2.69073486328125, 2.779937744140625, 2.869140625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 11.0, 7.0, 9.0, 14.0, 17.0, 23.0, 26.0, 27.0, 32.0, 37.0, 28.0, 42.0, 48.0, 47.0, 49.0, 42.0, 47.0, 50.0, 36.0, 45.0, 49.0, 50.0, 32.0, 41.0, 22.0, 23.0, 27.0, 23.0, 15.0, 16.0, 17.0, 9.0, 10.0, 9.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.56640625, -1.52099609375, -1.4755859375, -1.43017578125, -1.384765625, -1.33935546875, -1.2939453125, -1.24853515625, -1.203125, -1.15771484375, -1.1123046875, -1.06689453125, -1.021484375, -0.97607421875, -0.9306640625, -0.88525390625, -0.83984375, -0.79443359375, -0.7490234375, -0.70361328125, -0.658203125, -0.61279296875, -0.5673828125, -0.52197265625, -0.4765625, -0.43115234375, -0.3857421875, -0.34033203125, -0.294921875, -0.24951171875, -0.2041015625, -0.15869140625, -0.11328125, -0.06787109375, -0.0224609375, 0.02294921875, 0.068359375, 0.11376953125, 0.1591796875, 0.20458984375, 0.25, 0.29541015625, 0.3408203125, 0.38623046875, 0.431640625, 0.47705078125, 0.5224609375, 0.56787109375, 0.61328125, 0.65869140625, 0.7041015625, 0.74951171875, 0.794921875, 0.84033203125, 0.8857421875, 0.93115234375, 0.9765625, 1.02197265625, 1.0673828125, 1.11279296875, 1.158203125, 1.20361328125, 1.2490234375, 1.29443359375, 1.33984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 13.0, 14.0, 24.0, 44.0, 41.0, 57.0, 100.0, 158.0, 253.0, 318.0, 529.0, 863.0, 2038.0, 7017.0, 50514.0, 500672.0, 432967.0, 42454.0, 6248.0, 1792.0, 896.0, 478.0, 324.0, 213.0, 143.0, 101.0, 66.0, 42.0, 37.0, 27.0, 17.0, 21.0, 13.0, 8.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.65625, -9.3109130859375, -8.965576171875, -8.6202392578125, -8.27490234375, -7.9295654296875, -7.584228515625, -7.2388916015625, -6.8935546875, -6.5482177734375, -6.202880859375, -5.8575439453125, -5.51220703125, -5.1668701171875, -4.821533203125, -4.4761962890625, -4.130859375, -3.7855224609375, -3.440185546875, -3.0948486328125, -2.74951171875, -2.4041748046875, -2.058837890625, -1.7135009765625, -1.3681640625, -1.0228271484375, -0.677490234375, -0.3321533203125, 0.01318359375, 0.3585205078125, 0.703857421875, 1.0491943359375, 1.39453125, 1.7398681640625, 2.085205078125, 2.4305419921875, 2.77587890625, 3.1212158203125, 3.466552734375, 3.8118896484375, 4.1572265625, 4.5025634765625, 4.847900390625, 5.1932373046875, 5.53857421875, 5.8839111328125, 6.229248046875, 6.5745849609375, 6.919921875, 7.2652587890625, 7.610595703125, 7.9559326171875, 8.30126953125, 8.6466064453125, 8.991943359375, 9.3372802734375, 9.6826171875, 10.0279541015625, 10.373291015625, 10.7186279296875, 11.06396484375, 11.4093017578125, 11.754638671875, 12.0999755859375, 12.4453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 3.0, 16.0, 14.0, 14.0, 13.0, 21.0, 23.0, 23.0, 21.0, 35.0, 41.0, 43.0, 59.0, 48.0, 45.0, 52.0, 55.0, 45.0, 51.0, 47.0, 34.0, 32.0, 26.0, 38.0, 32.0, 27.0, 25.0, 17.0, 10.0, 9.0, 12.0, 6.0, 11.0, 10.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.078125, -7.8248291015625, -7.571533203125, -7.3182373046875, -7.06494140625, -6.8116455078125, -6.558349609375, -6.3050537109375, -6.0517578125, -5.7984619140625, -5.545166015625, -5.2918701171875, -5.03857421875, -4.7852783203125, -4.531982421875, -4.2786865234375, -4.025390625, -3.7720947265625, -3.518798828125, -3.2655029296875, -3.01220703125, -2.7589111328125, -2.505615234375, -2.2523193359375, -1.9990234375, -1.7457275390625, -1.492431640625, -1.2391357421875, -0.98583984375, -0.7325439453125, -0.479248046875, -0.2259521484375, 0.02734375, 0.2806396484375, 0.533935546875, 0.7872314453125, 1.04052734375, 1.2938232421875, 1.547119140625, 1.8004150390625, 2.0537109375, 2.3070068359375, 2.560302734375, 2.8135986328125, 3.06689453125, 3.3201904296875, 3.573486328125, 3.8267822265625, 4.080078125, 4.3333740234375, 4.586669921875, 4.8399658203125, 5.09326171875, 5.3465576171875, 5.599853515625, 5.8531494140625, 6.1064453125, 6.3597412109375, 6.613037109375, 6.8663330078125, 7.11962890625, 7.3729248046875, 7.626220703125, 7.8795166015625, 8.1328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 11.0, 11.0, 22.0, 31.0, 30.0, 73.0, 61.0, 135.0, 224.0, 494.0, 948.0, 2163.0, 6035.0, 22895.0, 119796.0, 561229.0, 271580.0, 46016.0, 10605.0, 3380.0, 1343.0, 639.0, 339.0, 182.0, 125.0, 63.0, 36.0, 16.0, 25.0, 7.0, 7.0, 10.0, 2.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0859375, -3.95294189453125, -3.8199462890625, -3.68695068359375, -3.553955078125, -3.42095947265625, -3.2879638671875, -3.15496826171875, -3.02197265625, -2.88897705078125, -2.7559814453125, -2.62298583984375, -2.489990234375, -2.35699462890625, -2.2239990234375, -2.09100341796875, -1.9580078125, -1.82501220703125, -1.6920166015625, -1.55902099609375, -1.426025390625, -1.29302978515625, -1.1600341796875, -1.02703857421875, -0.89404296875, -0.76104736328125, -0.6280517578125, -0.49505615234375, -0.362060546875, -0.22906494140625, -0.0960693359375, 0.03692626953125, 0.169921875, 0.30291748046875, 0.4359130859375, 0.56890869140625, 0.701904296875, 0.83489990234375, 0.9678955078125, 1.10089111328125, 1.23388671875, 1.36688232421875, 1.4998779296875, 1.63287353515625, 1.765869140625, 1.89886474609375, 2.0318603515625, 2.16485595703125, 2.2978515625, 2.43084716796875, 2.5638427734375, 2.69683837890625, 2.829833984375, 2.96282958984375, 3.0958251953125, 3.22882080078125, 3.36181640625, 3.49481201171875, 3.6278076171875, 3.76080322265625, 3.893798828125, 4.02679443359375, 4.1597900390625, 4.29278564453125, 4.42578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 9.0, 2.0, 2.0, 6.0, 4.0, 10.0, 10.0, 11.0, 16.0, 31.0, 41.0, 44.0, 56.0, 70.0, 107.0, 147.0, 96.0, 83.0, 64.0, 55.0, 36.0, 39.0, 17.0, 16.0, 10.0, 10.0, 9.0, 3.0, 0.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005578994750976562, -0.0005307048559188843, -0.0005035102367401123, -0.00047631561756134033, -0.00044912099838256836, -0.0004219263792037964, -0.0003947317600250244, -0.00036753714084625244, -0.00034034252166748047, -0.0003131479024887085, -0.0002859532833099365, -0.00025875866413116455, -0.00023156404495239258, -0.0002043694257736206, -0.00017717480659484863, -0.00014998018741607666, -0.0001227855682373047, -9.559094905853271e-05, -6.839632987976074e-05, -4.120171070098877e-05, -1.4007091522216797e-05, 1.3187527656555176e-05, 4.038214683532715e-05, 6.757676601409912e-05, 9.47713851928711e-05, 0.00012196600437164307, 0.00014916062355041504, 0.000176355242729187, 0.00020354986190795898, 0.00023074448108673096, 0.00025793910026550293, 0.0002851337194442749, 0.0003123283386230469, 0.00033952295780181885, 0.0003667175769805908, 0.0003939121961593628, 0.00042110681533813477, 0.00044830143451690674, 0.0004754960536956787, 0.0005026906728744507, 0.0005298852920532227, 0.0005570799112319946, 0.0005842745304107666, 0.0006114691495895386, 0.0006386637687683105, 0.0006658583879470825, 0.0006930530071258545, 0.0007202476263046265, 0.0007474422454833984, 0.0007746368646621704, 0.0008018314838409424, 0.0008290261030197144, 0.0008562207221984863, 0.0008834153413772583, 0.0009106099605560303, 0.0009378045797348022, 0.0009649991989135742, 0.0009921938180923462, 0.0010193884372711182, 0.0010465830564498901, 0.0010737776756286621, 0.001100972294807434, 0.001128166913986206, 0.001155361533164978, 0.00118255615234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 10.0, 10.0, 24.0, 31.0, 46.0, 77.0, 148.0, 262.0, 621.0, 1370.0, 4890.0, 33072.0, 522216.0, 450583.0, 28251.0, 4451.0, 1346.0, 561.0, 255.0, 126.0, 67.0, 41.0, 31.0, 12.0, 7.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.3671875, -7.156494140625, -6.94580078125, -6.735107421875, -6.5244140625, -6.313720703125, -6.10302734375, -5.892333984375, -5.681640625, -5.470947265625, -5.26025390625, -5.049560546875, -4.8388671875, -4.628173828125, -4.41748046875, -4.206787109375, -3.99609375, -3.785400390625, -3.57470703125, -3.364013671875, -3.1533203125, -2.942626953125, -2.73193359375, -2.521240234375, -2.310546875, -2.099853515625, -1.88916015625, -1.678466796875, -1.4677734375, -1.257080078125, -1.04638671875, -0.835693359375, -0.625, -0.414306640625, -0.20361328125, 0.007080078125, 0.2177734375, 0.428466796875, 0.63916015625, 0.849853515625, 1.060546875, 1.271240234375, 1.48193359375, 1.692626953125, 1.9033203125, 2.114013671875, 2.32470703125, 2.535400390625, 2.74609375, 2.956787109375, 3.16748046875, 3.378173828125, 3.5888671875, 3.799560546875, 4.01025390625, 4.220947265625, 4.431640625, 4.642333984375, 4.85302734375, 5.063720703125, 5.2744140625, 5.485107421875, 5.69580078125, 5.906494140625, 6.1171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 19.0, 26.0, 31.0, 31.0, 63.0, 74.0, 75.0, 95.0, 96.0, 120.0, 80.0, 86.0, 38.0, 44.0, 26.0, 17.0, 14.0, 12.0, 10.0, 4.0, 10.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.340667724609375, -5.20867919921875, -5.076690673828125, -4.9447021484375, -4.812713623046875, -4.68072509765625, -4.548736572265625, -4.416748046875, -4.284759521484375, -4.15277099609375, -4.020782470703125, -3.8887939453125, -3.756805419921875, -3.62481689453125, -3.492828369140625, -3.36083984375, -3.228851318359375, -3.09686279296875, -2.964874267578125, -2.8328857421875, -2.700897216796875, -2.56890869140625, -2.436920166015625, -2.304931640625, -2.172943115234375, -2.04095458984375, -1.908966064453125, -1.7769775390625, -1.644989013671875, -1.51300048828125, -1.381011962890625, -1.2490234375, -1.117034912109375, -0.98504638671875, -0.853057861328125, -0.7210693359375, -0.589080810546875, -0.45709228515625, -0.325103759765625, -0.193115234375, -0.061126708984375, 0.07086181640625, 0.202850341796875, 0.3348388671875, 0.466827392578125, 0.59881591796875, 0.730804443359375, 0.86279296875, 0.994781494140625, 1.12677001953125, 1.258758544921875, 1.3907470703125, 1.522735595703125, 1.65472412109375, 1.786712646484375, 1.918701171875, 2.050689697265625, 2.18267822265625, 2.314666748046875, 2.4466552734375, 2.578643798828125, 2.71063232421875, 2.842620849609375, 2.974609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 11.0, 37.0, 104.0, 181.0, 224.0, 204.0, 131.0, 61.0, 24.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-98.09187316894531, -95.1873779296875, -92.28288269042969, -89.3783950805664, -86.4738998413086, -83.56940460205078, -80.6649169921875, -77.76042175292969, -74.85592651367188, -71.95143127441406, -69.04693603515625, -66.14244842529297, -63.237953186035156, -60.333457946777344, -57.4289665222168, -54.52447509765625, -51.61997985839844, -48.715484619140625, -45.81099319458008, -42.90650177001953, -40.00200653076172, -37.097511291503906, -34.19301986694336, -31.28852653503418, -28.384033203125, -25.47953987121582, -22.57504653930664, -19.67055320739746, -16.76605987548828, -13.861566543579102, -10.957073211669922, -8.052579879760742, -5.1480865478515625, -2.243593215942383, 0.6609001159667969, 3.5653934478759766, 6.469886779785156, 9.374380111694336, 12.278873443603516, 15.183366775512695, 18.087860107421875, 20.992353439331055, 23.896846771240234, 26.801340103149414, 29.705833435058594, 32.610328674316406, 35.51482009887695, 38.4193115234375, 41.32380676269531, 44.228302001953125, 47.13279342651367, 50.03728485107422, 52.94178009033203, 55.846275329589844, 58.75076675415039, 61.65525817871094, 64.55975341796875, 67.46424865722656, 70.36874389648438, 73.27323150634766, 76.17772674560547, 79.08222198486328, 81.98670959472656, 84.89120483398438, 87.79570007324219]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 14.0, 11.0, 8.0, 17.0, 10.0, 17.0, 22.0, 34.0, 29.0, 31.0, 33.0, 35.0, 45.0, 50.0, 47.0, 52.0, 43.0, 50.0, 50.0, 60.0, 33.0, 40.0, 38.0, 24.0, 30.0, 26.0, 24.0, 21.0, 17.0, 10.0, 7.0, 20.0, 12.0, 5.0, 10.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-42.81682586669922, -41.53522491455078, -40.25362014770508, -38.97201919555664, -37.69041442871094, -36.4088134765625, -35.12721252441406, -33.84560775756836, -32.56400680541992, -31.28240394592285, -30.00080108642578, -28.719200134277344, -27.437597274780273, -26.155994415283203, -24.874391555786133, -23.592788696289062, -22.311185836791992, -21.029582977294922, -19.74798011779785, -18.46637725830078, -17.184776306152344, -15.903173446655273, -14.621570587158203, -13.33996868133545, -12.058365821838379, -10.776762962341309, -9.495161056518555, -8.213558197021484, -6.931955814361572, -5.65035343170166, -4.36875057220459, -3.087148666381836, -1.8055458068847656, -0.523943305015564, 0.7576591968536377, 2.039261817932129, 3.320864200592041, 4.602466583251953, 5.884069442749023, 7.165671348571777, 8.447274208068848, 9.728877067565918, 11.010478973388672, 12.292081832885742, 13.573684692382812, 14.855286598205566, 16.136890411376953, 17.41849136352539, 18.70009422302246, 19.98169708251953, 21.2632999420166, 22.544902801513672, 23.82650375366211, 25.10810661315918, 26.38970947265625, 27.671310424804688, 28.95291519165039, 30.23451805114746, 31.51612091064453, 32.79772186279297, 34.07932662963867, 35.36092758178711, 36.64253234863281, 37.92413330078125, 39.20573425292969]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 9.0, 23.0, 23.0, 37.0, 59.0, 92.0, 137.0, 229.0, 405.0, 732.0, 1401.0, 2870.0, 7562.0, 30767.0, 3574601.0, 535839.0, 26907.0, 6961.0, 2689.0, 1235.0, 672.0, 388.0, 227.0, 144.0, 84.0, 55.0, 33.0, 29.0, 26.0, 16.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2890625, -9.986083984375, -9.68310546875, -9.380126953125, -9.0771484375, -8.774169921875, -8.47119140625, -8.168212890625, -7.865234375, -7.562255859375, -7.25927734375, -6.956298828125, -6.6533203125, -6.350341796875, -6.04736328125, -5.744384765625, -5.44140625, -5.138427734375, -4.83544921875, -4.532470703125, -4.2294921875, -3.926513671875, -3.62353515625, -3.320556640625, -3.017578125, -2.714599609375, -2.41162109375, -2.108642578125, -1.8056640625, -1.502685546875, -1.19970703125, -0.896728515625, -0.59375, -0.290771484375, 0.01220703125, 0.315185546875, 0.6181640625, 0.921142578125, 1.22412109375, 1.527099609375, 1.830078125, 2.133056640625, 2.43603515625, 2.739013671875, 3.0419921875, 3.344970703125, 3.64794921875, 3.950927734375, 4.25390625, 4.556884765625, 4.85986328125, 5.162841796875, 5.4658203125, 5.768798828125, 6.07177734375, 6.374755859375, 6.677734375, 6.980712890625, 7.28369140625, 7.586669921875, 7.8896484375, 8.192626953125, 8.49560546875, 8.798583984375, 9.1015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 9.0, 7.0, 15.0, 12.0, 23.0, 26.0, 27.0, 34.0, 39.0, 41.0, 53.0, 42.0, 40.0, 62.0, 53.0, 61.0, 46.0, 57.0, 53.0, 43.0, 38.0, 35.0, 27.0, 36.0, 33.0, 19.0, 15.0, 17.0, 8.0, 9.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.17578125, -2.11541748046875, -2.0550537109375, -1.99468994140625, -1.934326171875, -1.87396240234375, -1.8135986328125, -1.75323486328125, -1.69287109375, -1.63250732421875, -1.5721435546875, -1.51177978515625, -1.451416015625, -1.39105224609375, -1.3306884765625, -1.27032470703125, -1.2099609375, -1.14959716796875, -1.0892333984375, -1.02886962890625, -0.968505859375, -0.90814208984375, -0.8477783203125, -0.78741455078125, -0.72705078125, -0.66668701171875, -0.6063232421875, -0.54595947265625, -0.485595703125, -0.42523193359375, -0.3648681640625, -0.30450439453125, -0.244140625, -0.18377685546875, -0.1234130859375, -0.06304931640625, -0.002685546875, 0.05767822265625, 0.1180419921875, 0.17840576171875, 0.23876953125, 0.29913330078125, 0.3594970703125, 0.41986083984375, 0.480224609375, 0.54058837890625, 0.6009521484375, 0.66131591796875, 0.7216796875, 0.78204345703125, 0.8424072265625, 0.90277099609375, 0.963134765625, 1.02349853515625, 1.0838623046875, 1.14422607421875, 1.20458984375, 1.26495361328125, 1.3253173828125, 1.38568115234375, 1.446044921875, 1.50640869140625, 1.5667724609375, 1.62713623046875, 1.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 1.0, 7.0, 7.0, 8.0, 19.0, 18.0, 21.0, 27.0, 45.0, 58.0, 81.0, 91.0, 167.0, 290.0, 457.0, 985.0, 2260.0, 6976.0, 34938.0, 3865111.0, 256657.0, 18057.0, 4542.0, 1617.0, 711.0, 378.0, 229.0, 130.0, 96.0, 85.0, 42.0, 44.0, 34.0, 25.0, 14.0, 14.0, 12.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-16.171875, -15.75537109375, -15.3388671875, -14.92236328125, -14.505859375, -14.08935546875, -13.6728515625, -13.25634765625, -12.83984375, -12.42333984375, -12.0068359375, -11.59033203125, -11.173828125, -10.75732421875, -10.3408203125, -9.92431640625, -9.5078125, -9.09130859375, -8.6748046875, -8.25830078125, -7.841796875, -7.42529296875, -7.0087890625, -6.59228515625, -6.17578125, -5.75927734375, -5.3427734375, -4.92626953125, -4.509765625, -4.09326171875, -3.6767578125, -3.26025390625, -2.84375, -2.42724609375, -2.0107421875, -1.59423828125, -1.177734375, -0.76123046875, -0.3447265625, 0.07177734375, 0.48828125, 0.90478515625, 1.3212890625, 1.73779296875, 2.154296875, 2.57080078125, 2.9873046875, 3.40380859375, 3.8203125, 4.23681640625, 4.6533203125, 5.06982421875, 5.486328125, 5.90283203125, 6.3193359375, 6.73583984375, 7.15234375, 7.56884765625, 7.9853515625, 8.40185546875, 8.818359375, 9.23486328125, 9.6513671875, 10.06787109375, 10.484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 10.0, 9.0, 13.0, 18.0, 47.0, 116.0, 443.0, 3148.0, 148.0, 58.0, 32.0, 13.0, 11.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.93359375, -2.839599609375, -2.74560546875, -2.651611328125, -2.5576171875, -2.463623046875, -2.36962890625, -2.275634765625, -2.181640625, -2.087646484375, -1.99365234375, -1.899658203125, -1.8056640625, -1.711669921875, -1.61767578125, -1.523681640625, -1.4296875, -1.335693359375, -1.24169921875, -1.147705078125, -1.0537109375, -0.959716796875, -0.86572265625, -0.771728515625, -0.677734375, -0.583740234375, -0.48974609375, -0.395751953125, -0.3017578125, -0.207763671875, -0.11376953125, -0.019775390625, 0.07421875, 0.168212890625, 0.26220703125, 0.356201171875, 0.4501953125, 0.544189453125, 0.63818359375, 0.732177734375, 0.826171875, 0.920166015625, 1.01416015625, 1.108154296875, 1.2021484375, 1.296142578125, 1.39013671875, 1.484130859375, 1.578125, 1.672119140625, 1.76611328125, 1.860107421875, 1.9541015625, 2.048095703125, 2.14208984375, 2.236083984375, 2.330078125, 2.424072265625, 2.51806640625, 2.612060546875, 2.7060546875, 2.800048828125, 2.89404296875, 2.988037109375, 3.08203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 8.0, 16.0, 20.0, 68.0, 93.0, 141.0, 178.0, 145.0, 132.0, 95.0, 44.0, 26.0, 13.0, 12.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.729338645935059, -11.368534088134766, -11.007730484008789, -10.646925926208496, -10.286121368408203, -9.925317764282227, -9.564513206481934, -9.20370864868164, -8.842905044555664, -8.482100486755371, -8.121296882629395, -7.760492324829102, -7.399688243865967, -7.038884162902832, -6.678079605102539, -6.317275524139404, -5.9564714431762695, -5.595667362213135, -5.23486328125, -4.874058723449707, -4.513254642486572, -4.1524505615234375, -3.7916462421417236, -3.4308419227600098, -3.070037841796875, -2.7092337608337402, -2.3484294414520264, -1.987625241279602, -1.6268210411071777, -1.2660168409347534, -0.9052126407623291, -0.5444083213806152, -0.18360328674316406, 0.17720091342926025, 0.5380051136016846, 0.8988093137741089, 1.2596135139465332, 1.6204177141189575, 1.9812219142913818, 2.3420262336730957, 2.7028303146362305, 3.0636343955993652, 3.424438714981079, 3.785243034362793, 4.146047115325928, 4.5068511962890625, 4.8676557540893555, 5.22845983505249, 5.589263916015625, 5.95006799697876, 6.3108720779418945, 6.6716766357421875, 7.032480716705322, 7.393284797668457, 7.75408935546875, 8.114892959594727, 8.47569751739502, 8.836502075195312, 9.197305679321289, 9.558110237121582, 9.918914794921875, 10.279718399047852, 10.640522956848145, 11.001327514648438, 11.362131118774414]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 8.0, 9.0, 8.0, 8.0, 12.0, 8.0, 15.0, 14.0, 19.0, 17.0, 21.0, 27.0, 25.0, 27.0, 45.0, 29.0, 33.0, 44.0, 51.0, 28.0, 41.0, 31.0, 43.0, 37.0, 37.0, 34.0, 43.0, 29.0, 35.0, 35.0, 29.0, 25.0, 20.0, 19.0, 20.0, 17.0, 11.0, 8.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.480663299560547, -4.341196537017822, -4.201730251312256, -4.062263488769531, -3.922797203063965, -3.7833304405212402, -3.6438639163970947, -3.504397392272949, -3.3649308681488037, -3.225464344024658, -3.0859978199005127, -2.946531295776367, -2.8070645332336426, -2.667598247528076, -2.5281314849853516, -2.388664960861206, -2.2491984367370605, -2.109731912612915, -1.9702653884887695, -1.8307987451553345, -1.691332221031189, -1.5518656969070435, -1.4123990535736084, -1.272932529449463, -1.1334660053253174, -0.9939994812011719, -0.8545328974723816, -0.7150663137435913, -0.5755997896194458, -0.4361332654953003, -0.29666668176651, -0.15720009803771973, -0.017734050750732422, 0.12173250317573547, 0.26119905710220337, 0.40066561102867126, 0.5401321649551392, 0.6795986890792847, 0.819065272808075, 0.9585318565368652, 1.0979983806610107, 1.2374649047851562, 1.3769314289093018, 1.5163980722427368, 1.6558645963668823, 1.7953311204910278, 1.934797763824463, 2.0742642879486084, 2.213730812072754, 2.3531973361968994, 2.492663860321045, 2.6321303844451904, 2.771596908569336, 2.9110636711120605, 3.050530195236206, 3.1899967193603516, 3.329463243484497, 3.4689297676086426, 3.608396291732788, 3.7478628158569336, 3.887329578399658, 4.026795864105225, 4.166262626647949, 4.305728912353516, 4.44519567489624]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 6.0, 14.0, 19.0, 23.0, 34.0, 42.0, 73.0, 130.0, 261.0, 642.0, 1670.0, 4574.0, 12930.0, 38224.0, 108880.0, 262650.0, 336515.0, 180437.0, 65868.0, 22815.0, 8016.0, 2734.0, 1032.0, 446.0, 222.0, 100.0, 56.0, 41.0, 25.0, 14.0, 11.0, 13.0, 2.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.40625, -5.2529296875, -5.099609375, -4.9462890625, -4.79296875, -4.6396484375, -4.486328125, -4.3330078125, -4.1796875, -4.0263671875, -3.873046875, -3.7197265625, -3.56640625, -3.4130859375, -3.259765625, -3.1064453125, -2.953125, -2.7998046875, -2.646484375, -2.4931640625, -2.33984375, -2.1865234375, -2.033203125, -1.8798828125, -1.7265625, -1.5732421875, -1.419921875, -1.2666015625, -1.11328125, -0.9599609375, -0.806640625, -0.6533203125, -0.5, -0.3466796875, -0.193359375, -0.0400390625, 0.11328125, 0.2666015625, 0.419921875, 0.5732421875, 0.7265625, 0.8798828125, 1.033203125, 1.1865234375, 1.33984375, 1.4931640625, 1.646484375, 1.7998046875, 1.953125, 2.1064453125, 2.259765625, 2.4130859375, 2.56640625, 2.7197265625, 2.873046875, 3.0263671875, 3.1796875, 3.3330078125, 3.486328125, 3.6396484375, 3.79296875, 3.9462890625, 4.099609375, 4.2529296875, 4.40625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 12.0, 17.0, 19.0, 14.0, 24.0, 23.0, 35.0, 35.0, 39.0, 56.0, 43.0, 39.0, 63.0, 44.0, 51.0, 38.0, 51.0, 52.0, 40.0, 43.0, 42.0, 48.0, 45.0, 27.0, 18.0, 12.0, 12.0, 9.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.298828125, -2.233367919921875, -2.16790771484375, -2.102447509765625, -2.0369873046875, -1.971527099609375, -1.90606689453125, -1.840606689453125, -1.775146484375, -1.709686279296875, -1.64422607421875, -1.578765869140625, -1.5133056640625, -1.447845458984375, -1.38238525390625, -1.316925048828125, -1.25146484375, -1.186004638671875, -1.12054443359375, -1.055084228515625, -0.9896240234375, -0.924163818359375, -0.85870361328125, -0.793243408203125, -0.727783203125, -0.662322998046875, -0.59686279296875, -0.531402587890625, -0.4659423828125, -0.400482177734375, -0.33502197265625, -0.269561767578125, -0.2041015625, -0.138641357421875, -0.07318115234375, -0.007720947265625, 0.0577392578125, 0.123199462890625, 0.18865966796875, 0.254119873046875, 0.319580078125, 0.385040283203125, 0.45050048828125, 0.515960693359375, 0.5814208984375, 0.646881103515625, 0.71234130859375, 0.777801513671875, 0.84326171875, 0.908721923828125, 0.97418212890625, 1.039642333984375, 1.1051025390625, 1.170562744140625, 1.23602294921875, 1.301483154296875, 1.366943359375, 1.432403564453125, 1.49786376953125, 1.563323974609375, 1.6287841796875, 1.694244384765625, 1.75970458984375, 1.825164794921875, 1.890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 9.0, 16.0, 21.0, 28.0, 40.0, 63.0, 93.0, 145.0, 216.0, 322.0, 504.0, 936.0, 1731.0, 5392.0, 46582.0, 630791.0, 332322.0, 22281.0, 3616.0, 1381.0, 694.0, 465.0, 277.0, 186.0, 137.0, 89.0, 55.0, 32.0, 26.0, 27.0, 14.0, 8.0, 12.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.546875, -11.172607421875, -10.79833984375, -10.424072265625, -10.0498046875, -9.675537109375, -9.30126953125, -8.927001953125, -8.552734375, -8.178466796875, -7.80419921875, -7.429931640625, -7.0556640625, -6.681396484375, -6.30712890625, -5.932861328125, -5.55859375, -5.184326171875, -4.81005859375, -4.435791015625, -4.0615234375, -3.687255859375, -3.31298828125, -2.938720703125, -2.564453125, -2.190185546875, -1.81591796875, -1.441650390625, -1.0673828125, -0.693115234375, -0.31884765625, 0.055419921875, 0.4296875, 0.803955078125, 1.17822265625, 1.552490234375, 1.9267578125, 2.301025390625, 2.67529296875, 3.049560546875, 3.423828125, 3.798095703125, 4.17236328125, 4.546630859375, 4.9208984375, 5.295166015625, 5.66943359375, 6.043701171875, 6.41796875, 6.792236328125, 7.16650390625, 7.540771484375, 7.9150390625, 8.289306640625, 8.66357421875, 9.037841796875, 9.412109375, 9.786376953125, 10.16064453125, 10.534912109375, 10.9091796875, 11.283447265625, 11.65771484375, 12.031982421875, 12.40625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 14.0, 20.0, 23.0, 33.0, 44.0, 54.0, 66.0, 70.0, 67.0, 92.0, 82.0, 85.0, 58.0, 64.0, 56.0, 45.0, 45.0, 25.0, 24.0, 8.0, 5.0, 10.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.4891357421875, -17.978271484375, -17.4674072265625, -16.95654296875, -16.4456787109375, -15.934814453125, -15.4239501953125, -14.9130859375, -14.4022216796875, -13.891357421875, -13.3804931640625, -12.86962890625, -12.3587646484375, -11.847900390625, -11.3370361328125, -10.826171875, -10.3153076171875, -9.804443359375, -9.2935791015625, -8.78271484375, -8.2718505859375, -7.760986328125, -7.2501220703125, -6.7392578125, -6.2283935546875, -5.717529296875, -5.2066650390625, -4.69580078125, -4.1849365234375, -3.674072265625, -3.1632080078125, -2.65234375, -2.1414794921875, -1.630615234375, -1.1197509765625, -0.60888671875, -0.0980224609375, 0.412841796875, 0.9237060546875, 1.4345703125, 1.9454345703125, 2.456298828125, 2.9671630859375, 3.47802734375, 3.9888916015625, 4.499755859375, 5.0106201171875, 5.521484375, 6.0323486328125, 6.543212890625, 7.0540771484375, 7.56494140625, 8.0758056640625, 8.586669921875, 9.0975341796875, 9.6083984375, 10.1192626953125, 10.630126953125, 11.1409912109375, 11.65185546875, 12.1627197265625, 12.673583984375, 13.1844482421875, 13.6953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 5.0, 4.0, 12.0, 8.0, 15.0, 23.0, 23.0, 31.0, 62.0, 64.0, 90.0, 171.0, 339.0, 616.0, 1190.0, 2872.0, 9093.0, 37469.0, 184775.0, 534340.0, 216940.0, 43870.0, 10437.0, 3228.0, 1378.0, 625.0, 323.0, 180.0, 110.0, 71.0, 52.0, 35.0, 26.0, 26.0, 11.0, 9.0, 11.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.83984375, -2.743743896484375, -2.64764404296875, -2.551544189453125, -2.4554443359375, -2.359344482421875, -2.26324462890625, -2.167144775390625, -2.071044921875, -1.974945068359375, -1.87884521484375, -1.782745361328125, -1.6866455078125, -1.590545654296875, -1.49444580078125, -1.398345947265625, -1.30224609375, -1.206146240234375, -1.11004638671875, -1.013946533203125, -0.9178466796875, -0.821746826171875, -0.72564697265625, -0.629547119140625, -0.533447265625, -0.437347412109375, -0.34124755859375, -0.245147705078125, -0.1490478515625, -0.052947998046875, 0.04315185546875, 0.139251708984375, 0.2353515625, 0.331451416015625, 0.42755126953125, 0.523651123046875, 0.6197509765625, 0.715850830078125, 0.81195068359375, 0.908050537109375, 1.004150390625, 1.100250244140625, 1.19635009765625, 1.292449951171875, 1.3885498046875, 1.484649658203125, 1.58074951171875, 1.676849365234375, 1.77294921875, 1.869049072265625, 1.96514892578125, 2.061248779296875, 2.1573486328125, 2.253448486328125, 2.34954833984375, 2.445648193359375, 2.541748046875, 2.637847900390625, 2.73394775390625, 2.830047607421875, 2.9261474609375, 3.022247314453125, 3.11834716796875, 3.214447021484375, 3.310546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 10.0, 11.0, 12.0, 18.0, 21.0, 21.0, 30.0, 48.0, 54.0, 66.0, 70.0, 81.0, 74.0, 79.0, 75.0, 71.0, 63.0, 41.0, 40.0, 30.0, 15.0, 17.0, 12.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042057037353515625, -0.00040284544229507446, -0.0003851205110549927, -0.0003673955798149109, -0.0003496706485748291, -0.0003319457173347473, -0.00031422078609466553, -0.00029649585485458374, -0.00027877092361450195, -0.00026104599237442017, -0.00024332106113433838, -0.0002255961298942566, -0.0002078711986541748, -0.00019014626741409302, -0.00017242133617401123, -0.00015469640493392944, -0.00013697147369384766, -0.00011924654245376587, -0.00010152161121368408, -8.37966799736023e-05, -6.607174873352051e-05, -4.834681749343872e-05, -3.0621886253356934e-05, -1.2896955013275146e-05, 4.827976226806641e-06, 2.2552907466888428e-05, 4.0277838706970215e-05, 5.8002769947052e-05, 7.572770118713379e-05, 9.345263242721558e-05, 0.00011117756366729736, 0.00012890249490737915, 0.00014662742614746094, 0.00016435235738754272, 0.0001820772886276245, 0.0001998022198677063, 0.00021752715110778809, 0.00023525208234786987, 0.00025297701358795166, 0.00027070194482803345, 0.00028842687606811523, 0.000306151807308197, 0.0003238767385482788, 0.0003416016697883606, 0.0003593266010284424, 0.00037705153226852417, 0.00039477646350860596, 0.00041250139474868774, 0.00043022632598876953, 0.0004479512572288513, 0.0004656761884689331, 0.0004834011197090149, 0.0005011260509490967, 0.0005188509821891785, 0.0005365759134292603, 0.000554300844669342, 0.0005720257759094238, 0.0005897507071495056, 0.0006074756383895874, 0.0006252005696296692, 0.000642925500869751, 0.0006606504321098328, 0.0006783753633499146, 0.0006961002945899963, 0.0007138252258300781]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 5.0, 6.0, 15.0, 13.0, 23.0, 32.0, 55.0, 74.0, 102.0, 210.0, 361.0, 722.0, 1553.0, 4250.0, 19366.0, 172269.0, 669361.0, 155250.0, 17801.0, 3942.0, 1491.0, 733.0, 376.0, 182.0, 104.0, 63.0, 57.0, 41.0, 17.0, 22.0, 12.0, 10.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.56640625, -4.4339599609375, -4.301513671875, -4.1690673828125, -4.03662109375, -3.9041748046875, -3.771728515625, -3.6392822265625, -3.5068359375, -3.3743896484375, -3.241943359375, -3.1094970703125, -2.97705078125, -2.8446044921875, -2.712158203125, -2.5797119140625, -2.447265625, -2.3148193359375, -2.182373046875, -2.0499267578125, -1.91748046875, -1.7850341796875, -1.652587890625, -1.5201416015625, -1.3876953125, -1.2552490234375, -1.122802734375, -0.9903564453125, -0.85791015625, -0.7254638671875, -0.593017578125, -0.4605712890625, -0.328125, -0.1956787109375, -0.063232421875, 0.0692138671875, 0.20166015625, 0.3341064453125, 0.466552734375, 0.5989990234375, 0.7314453125, 0.8638916015625, 0.996337890625, 1.1287841796875, 1.26123046875, 1.3936767578125, 1.526123046875, 1.6585693359375, 1.791015625, 1.9234619140625, 2.055908203125, 2.1883544921875, 2.32080078125, 2.4532470703125, 2.585693359375, 2.7181396484375, 2.8505859375, 2.9830322265625, 3.115478515625, 3.2479248046875, 3.38037109375, 3.5128173828125, 3.645263671875, 3.7777099609375, 3.91015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 16.0, 23.0, 48.0, 60.0, 82.0, 103.0, 130.0, 116.0, 129.0, 90.0, 69.0, 49.0, 34.0, 24.0, 12.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.8621826171875, -4.700927734375, -4.5396728515625, -4.37841796875, -4.2171630859375, -4.055908203125, -3.8946533203125, -3.7333984375, -3.5721435546875, -3.410888671875, -3.2496337890625, -3.08837890625, -2.9271240234375, -2.765869140625, -2.6046142578125, -2.443359375, -2.2821044921875, -2.120849609375, -1.9595947265625, -1.79833984375, -1.6370849609375, -1.475830078125, -1.3145751953125, -1.1533203125, -0.9920654296875, -0.830810546875, -0.6695556640625, -0.50830078125, -0.3470458984375, -0.185791015625, -0.0245361328125, 0.13671875, 0.2979736328125, 0.459228515625, 0.6204833984375, 0.78173828125, 0.9429931640625, 1.104248046875, 1.2655029296875, 1.4267578125, 1.5880126953125, 1.749267578125, 1.9105224609375, 2.07177734375, 2.2330322265625, 2.394287109375, 2.5555419921875, 2.716796875, 2.8780517578125, 3.039306640625, 3.2005615234375, 3.36181640625, 3.5230712890625, 3.684326171875, 3.8455810546875, 4.0068359375, 4.1680908203125, 4.329345703125, 4.4906005859375, 4.65185546875, 4.8131103515625, 4.974365234375, 5.1356201171875, 5.296875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 18.0, 97.0, 241.0, 333.0, 201.0, 81.0, 21.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.0122184753418, -55.79755401611328, -51.582889556884766, -47.36822509765625, -43.15355682373047, -38.93889617919922, -34.72422790527344, -30.509563446044922, -26.294898986816406, -22.08023452758789, -17.865570068359375, -13.650903701782227, -9.436239242553711, -5.221574783325195, -1.0069084167480469, 3.2077560424804688, 7.422420501708984, 11.6370849609375, 15.851750373840332, 20.066415786743164, 24.28108024597168, 28.495744705200195, 32.710411071777344, 36.92507553100586, 41.139739990234375, 45.35440444946289, 49.569068908691406, 53.78373718261719, 57.99839782714844, 62.21306610107422, 66.427734375, 70.64239501953125, 74.85707092285156, 79.07173919677734, 83.2863998413086, 87.50106811523438, 91.71572875976562, 95.9303970336914, 100.14506530761719, 104.35972595214844, 108.57438659667969, 112.78905487060547, 117.00371551513672, 121.2183837890625, 125.43304443359375, 129.647705078125, 133.8623809814453, 138.07704162597656, 142.29171752929688, 146.50637817382812, 150.72105407714844, 154.9357147216797, 159.15037536621094, 163.3650360107422, 167.5797119140625, 171.79437255859375, 176.009033203125, 180.22369384765625, 184.43836975097656, 188.6530303955078, 192.86769104003906, 197.0823516845703, 201.29702758789062, 205.51168823242188, 209.72634887695312]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 4.0, 4.0, 11.0, 13.0, 9.0, 12.0, 7.0, 13.0, 17.0, 19.0, 21.0, 27.0, 28.0, 22.0, 27.0, 26.0, 33.0, 41.0, 36.0, 53.0, 35.0, 50.0, 36.0, 38.0, 35.0, 34.0, 46.0, 35.0, 26.0, 30.0, 31.0, 17.0, 23.0, 29.0, 17.0, 15.0, 13.0, 14.0, 13.0, 4.0, 9.0, 3.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-37.893898010253906, -36.66217041015625, -35.43044662475586, -34.1987190246582, -32.96699523925781, -31.735267639160156, -30.503541946411133, -29.27181625366211, -28.040090560913086, -26.808364868164062, -25.57663917541504, -24.344913482666016, -23.11318588256836, -21.88146209716797, -20.649734497070312, -19.41800880432129, -18.186283111572266, -16.954557418823242, -15.722831726074219, -14.491105079650879, -13.259379386901855, -12.027653694152832, -10.795927047729492, -9.564201354980469, -8.332475662231445, -7.100749969482422, -5.86902379989624, -4.637297630310059, -3.405571937561035, -2.1738462448120117, -0.9421200752258301, 0.28960609436035156, 1.521331787109375, 2.7530577182769775, 3.98478364944458, 5.216509819030762, 6.448235511779785, 7.679961204528809, 8.911687850952148, 10.143413543701172, 11.375139236450195, 12.606864929199219, 13.838590621948242, 15.070317268371582, 16.302043914794922, 17.533767700195312, 18.76549530029297, 19.997220993041992, 21.228946685791016, 22.46067237854004, 23.692398071289062, 24.924123764038086, 26.15584945678711, 27.387577056884766, 28.61930274963379, 29.851028442382812, 31.082754135131836, 32.31447982788086, 33.546207427978516, 34.777931213378906, 36.00965881347656, 37.24138259887695, 38.47311019897461, 39.704833984375, 40.936561584472656]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 4.0, 10.0, 15.0, 25.0, 35.0, 52.0, 69.0, 92.0, 198.0, 271.0, 473.0, 818.0, 1590.0, 3420.0, 8562.0, 29608.0, 308762.0, 3771076.0, 48530.0, 11739.0, 4371.0, 2051.0, 1006.0, 569.0, 319.0, 191.0, 149.0, 88.0, 50.0, 50.0, 24.0, 20.0, 15.0, 7.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.86328125, -6.6356201171875, -6.407958984375, -6.1802978515625, -5.95263671875, -5.7249755859375, -5.497314453125, -5.2696533203125, -5.0419921875, -4.8143310546875, -4.586669921875, -4.3590087890625, -4.13134765625, -3.9036865234375, -3.676025390625, -3.4483642578125, -3.220703125, -2.9930419921875, -2.765380859375, -2.5377197265625, -2.31005859375, -2.0823974609375, -1.854736328125, -1.6270751953125, -1.3994140625, -1.1717529296875, -0.944091796875, -0.7164306640625, -0.48876953125, -0.2611083984375, -0.033447265625, 0.1942138671875, 0.421875, 0.6495361328125, 0.877197265625, 1.1048583984375, 1.33251953125, 1.5601806640625, 1.787841796875, 2.0155029296875, 2.2431640625, 2.4708251953125, 2.698486328125, 2.9261474609375, 3.15380859375, 3.3814697265625, 3.609130859375, 3.8367919921875, 4.064453125, 4.2921142578125, 4.519775390625, 4.7474365234375, 4.97509765625, 5.2027587890625, 5.430419921875, 5.6580810546875, 5.8857421875, 6.1134033203125, 6.341064453125, 6.5687255859375, 6.79638671875, 7.0240478515625, 7.251708984375, 7.4793701171875, 7.70703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 11.0, 11.0, 10.0, 16.0, 21.0, 20.0, 29.0, 41.0, 40.0, 27.0, 52.0, 53.0, 40.0, 53.0, 64.0, 60.0, 49.0, 53.0, 44.0, 52.0, 39.0, 39.0, 30.0, 41.0, 19.0, 14.0, 16.0, 12.0, 14.0, 7.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.390625, -2.322174072265625, -2.25372314453125, -2.185272216796875, -2.1168212890625, -2.048370361328125, -1.97991943359375, -1.911468505859375, -1.843017578125, -1.774566650390625, -1.70611572265625, -1.637664794921875, -1.5692138671875, -1.500762939453125, -1.43231201171875, -1.363861083984375, -1.29541015625, -1.226959228515625, -1.15850830078125, -1.090057373046875, -1.0216064453125, -0.953155517578125, -0.88470458984375, -0.816253662109375, -0.747802734375, -0.679351806640625, -0.61090087890625, -0.542449951171875, -0.4739990234375, -0.405548095703125, -0.33709716796875, -0.268646240234375, -0.2001953125, -0.131744384765625, -0.06329345703125, 0.005157470703125, 0.0736083984375, 0.142059326171875, 0.21051025390625, 0.278961181640625, 0.347412109375, 0.415863037109375, 0.48431396484375, 0.552764892578125, 0.6212158203125, 0.689666748046875, 0.75811767578125, 0.826568603515625, 0.89501953125, 0.963470458984375, 1.03192138671875, 1.100372314453125, 1.1688232421875, 1.237274169921875, 1.30572509765625, 1.374176025390625, 1.442626953125, 1.511077880859375, 1.57952880859375, 1.647979736328125, 1.7164306640625, 1.784881591796875, 1.85333251953125, 1.921783447265625, 1.990234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 6.0, 11.0, 10.0, 16.0, 24.0, 37.0, 49.0, 75.0, 95.0, 137.0, 183.0, 283.0, 444.0, 661.0, 1016.0, 1682.0, 2983.0, 5507.0, 11660.0, 28471.0, 99883.0, 3498236.0, 441546.0, 60788.0, 20479.0, 8979.0, 4442.0, 2492.0, 1385.0, 885.0, 548.0, 367.0, 260.0, 190.0, 120.0, 98.0, 64.0, 42.0, 26.0, 24.0, 26.0, 15.0, 11.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.55859375, -5.39898681640625, -5.2393798828125, -5.07977294921875, -4.920166015625, -4.76055908203125, -4.6009521484375, -4.44134521484375, -4.28173828125, -4.12213134765625, -3.9625244140625, -3.80291748046875, -3.643310546875, -3.48370361328125, -3.3240966796875, -3.16448974609375, -3.0048828125, -2.84527587890625, -2.6856689453125, -2.52606201171875, -2.366455078125, -2.20684814453125, -2.0472412109375, -1.88763427734375, -1.72802734375, -1.56842041015625, -1.4088134765625, -1.24920654296875, -1.089599609375, -0.92999267578125, -0.7703857421875, -0.61077880859375, -0.451171875, -0.29156494140625, -0.1319580078125, 0.02764892578125, 0.187255859375, 0.34686279296875, 0.5064697265625, 0.66607666015625, 0.82568359375, 0.98529052734375, 1.1448974609375, 1.30450439453125, 1.464111328125, 1.62371826171875, 1.7833251953125, 1.94293212890625, 2.1025390625, 2.26214599609375, 2.4217529296875, 2.58135986328125, 2.740966796875, 2.90057373046875, 3.0601806640625, 3.21978759765625, 3.37939453125, 3.53900146484375, 3.6986083984375, 3.85821533203125, 4.017822265625, 4.17742919921875, 4.3370361328125, 4.49664306640625, 4.65625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 8.0, 16.0, 17.0, 21.0, 26.0, 54.0, 91.0, 234.0, 2660.0, 590.0, 137.0, 71.0, 38.0, 27.0, 21.0, 16.0, 12.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.642242431640625, -1.58526611328125, -1.528289794921875, -1.4713134765625, -1.414337158203125, -1.35736083984375, -1.300384521484375, -1.243408203125, -1.186431884765625, -1.12945556640625, -1.072479248046875, -1.0155029296875, -0.958526611328125, -0.90155029296875, -0.844573974609375, -0.78759765625, -0.730621337890625, -0.67364501953125, -0.616668701171875, -0.5596923828125, -0.502716064453125, -0.44573974609375, -0.388763427734375, -0.331787109375, -0.274810791015625, -0.21783447265625, -0.160858154296875, -0.1038818359375, -0.046905517578125, 0.01007080078125, 0.067047119140625, 0.1240234375, 0.180999755859375, 0.23797607421875, 0.294952392578125, 0.3519287109375, 0.408905029296875, 0.46588134765625, 0.522857666015625, 0.579833984375, 0.636810302734375, 0.69378662109375, 0.750762939453125, 0.8077392578125, 0.864715576171875, 0.92169189453125, 0.978668212890625, 1.03564453125, 1.092620849609375, 1.14959716796875, 1.206573486328125, 1.2635498046875, 1.320526123046875, 1.37750244140625, 1.434478759765625, 1.491455078125, 1.548431396484375, 1.60540771484375, 1.662384033203125, 1.7193603515625, 1.776336669921875, 1.83331298828125, 1.890289306640625, 1.947265625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 8.0, 4.0, 6.0, 17.0, 18.0, 24.0, 31.0, 32.0, 45.0, 42.0, 55.0, 56.0, 87.0, 79.0, 69.0, 61.0, 55.0, 75.0, 51.0, 48.0, 29.0, 25.0, 21.0, 18.0, 11.0, 9.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.938452243804932, -5.767966270446777, -5.597479820251465, -5.426993370056152, -5.256507396697998, -5.086021423339844, -4.915534973144531, -4.745048522949219, -4.5745625495910645, -4.40407657623291, -4.233590126037598, -4.063103675842285, -3.892617702484131, -3.7221314907073975, -3.551645278930664, -3.3811590671539307, -3.2106728553771973, -3.040186643600464, -2.8697004318237305, -2.699214220046997, -2.5287280082702637, -2.3582417964935303, -2.187755584716797, -2.0172693729400635, -1.84678316116333, -1.6762969493865967, -1.5058107376098633, -1.3353245258331299, -1.1648383140563965, -0.9943521022796631, -0.8238658905029297, -0.6533796787261963, -0.4828929901123047, -0.3124067783355713, -0.1419205665588379, 0.028565645217895508, 0.1990518569946289, 0.3695380687713623, 0.5400242805480957, 0.7105104923248291, 0.8809967041015625, 1.051482915878296, 1.2219691276550293, 1.3924553394317627, 1.562941551208496, 1.7334277629852295, 1.903913974761963, 2.0744001865386963, 2.2448863983154297, 2.415372610092163, 2.5858588218688965, 2.75634503364563, 2.9268312454223633, 3.0973174571990967, 3.26780366897583, 3.4382898807525635, 3.608776092529297, 3.7792623043060303, 3.9497485160827637, 4.120234489440918, 4.2907209396362305, 4.461207389831543, 4.631693363189697, 4.802179336547852, 4.972665786743164]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 2.0, 8.0, 7.0, 11.0, 11.0, 14.0, 21.0, 15.0, 21.0, 26.0, 19.0, 30.0, 36.0, 36.0, 35.0, 33.0, 36.0, 42.0, 43.0, 45.0, 39.0, 36.0, 33.0, 43.0, 30.0, 31.0, 36.0, 33.0, 30.0, 26.0, 20.0, 27.0, 19.0, 25.0, 13.0, 11.0, 10.0, 13.0, 12.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.8562612533569336, -3.7202951908111572, -3.584329128265381, -3.4483633041381836, -3.3123972415924072, -3.176431179046631, -3.0404651165008545, -2.904499053955078, -2.768533229827881, -2.6325671672821045, -2.496601104736328, -2.360635280609131, -2.2246692180633545, -2.088703155517578, -1.9527370929718018, -1.8167710304260254, -1.680804967880249, -1.5448389053344727, -1.4088729619979858, -1.2729068994522095, -1.1369409561157227, -1.0009748935699463, -0.8650088310241699, -0.7290428280830383, -0.5930768251419067, -0.45711082220077515, -0.32114478945732117, -0.1851787567138672, -0.049212753772735596, 0.086753249168396, 0.22271931171417236, 0.35868531465530396, 0.49465131759643555, 0.6306173205375671, 0.7665833234786987, 0.9025493860244751, 1.038515329360962, 1.1744813919067383, 1.3104474544525146, 1.446413516998291, 1.5823794603347778, 1.7183455228805542, 1.854311466217041, 1.9902775287628174, 2.1262435913085938, 2.262209415435791, 2.3981757164001465, 2.5341415405273438, 2.67010760307312, 2.8060736656188965, 2.942039728164673, 3.078005790710449, 3.2139716148376465, 3.349937677383423, 3.485903739929199, 3.6218698024749756, 3.757835865020752, 3.8938019275665283, 4.029767990112305, 4.165733814239502, 4.301700115203857, 4.437665939331055, 4.57363224029541, 4.709598064422607, 4.845563888549805]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 15.0, 26.0, 42.0, 68.0, 113.0, 167.0, 290.0, 539.0, 959.0, 1810.0, 3399.0, 7026.0, 15071.0, 33315.0, 74000.0, 154808.0, 255181.0, 242305.0, 138492.0, 65133.0, 29303.0, 13493.0, 6206.0, 3149.0, 1641.0, 839.0, 467.0, 248.0, 154.0, 96.0, 65.0, 37.0, 26.0, 17.0, 15.0, 6.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.095703125, -2.99871826171875, -2.9017333984375, -2.80474853515625, -2.707763671875, -2.61077880859375, -2.5137939453125, -2.41680908203125, -2.31982421875, -2.22283935546875, -2.1258544921875, -2.02886962890625, -1.931884765625, -1.83489990234375, -1.7379150390625, -1.64093017578125, -1.5439453125, -1.44696044921875, -1.3499755859375, -1.25299072265625, -1.156005859375, -1.05902099609375, -0.9620361328125, -0.86505126953125, -0.76806640625, -0.67108154296875, -0.5740966796875, -0.47711181640625, -0.380126953125, -0.28314208984375, -0.1861572265625, -0.08917236328125, 0.0078125, 0.10479736328125, 0.2017822265625, 0.29876708984375, 0.395751953125, 0.49273681640625, 0.5897216796875, 0.68670654296875, 0.78369140625, 0.88067626953125, 0.9776611328125, 1.07464599609375, 1.171630859375, 1.26861572265625, 1.3656005859375, 1.46258544921875, 1.5595703125, 1.65655517578125, 1.7535400390625, 1.85052490234375, 1.947509765625, 2.04449462890625, 2.1414794921875, 2.23846435546875, 2.33544921875, 2.43243408203125, 2.5294189453125, 2.62640380859375, 2.723388671875, 2.82037353515625, 2.9173583984375, 3.01434326171875, 3.111328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 5.0, 10.0, 11.0, 31.0, 25.0, 17.0, 34.0, 30.0, 45.0, 56.0, 55.0, 59.0, 74.0, 70.0, 66.0, 65.0, 48.0, 57.0, 44.0, 52.0, 34.0, 17.0, 22.0, 19.0, 11.0, 12.0, 5.0, 1.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.777374267578125, -2.69146728515625, -2.605560302734375, -2.5196533203125, -2.433746337890625, -2.34783935546875, -2.261932373046875, -2.176025390625, -2.090118408203125, -2.00421142578125, -1.918304443359375, -1.8323974609375, -1.746490478515625, -1.66058349609375, -1.574676513671875, -1.48876953125, -1.402862548828125, -1.31695556640625, -1.231048583984375, -1.1451416015625, -1.059234619140625, -0.97332763671875, -0.887420654296875, -0.801513671875, -0.715606689453125, -0.62969970703125, -0.543792724609375, -0.4578857421875, -0.371978759765625, -0.28607177734375, -0.200164794921875, -0.1142578125, -0.028350830078125, 0.05755615234375, 0.143463134765625, 0.2293701171875, 0.315277099609375, 0.40118408203125, 0.487091064453125, 0.572998046875, 0.658905029296875, 0.74481201171875, 0.830718994140625, 0.9166259765625, 1.002532958984375, 1.08843994140625, 1.174346923828125, 1.26025390625, 1.346160888671875, 1.43206787109375, 1.517974853515625, 1.6038818359375, 1.689788818359375, 1.77569580078125, 1.861602783203125, 1.947509765625, 2.033416748046875, 2.11932373046875, 2.205230712890625, 2.2911376953125, 2.377044677734375, 2.46295166015625, 2.548858642578125, 2.634765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 10.0, 6.0, 7.0, 14.0, 27.0, 31.0, 28.0, 64.0, 101.0, 140.0, 228.0, 433.0, 790.0, 1623.0, 5990.0, 128712.0, 868723.0, 35362.0, 3428.0, 1331.0, 617.0, 317.0, 216.0, 92.0, 66.0, 43.0, 43.0, 33.0, 16.0, 12.0, 12.0, 6.0, 2.0, 6.0, 1.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.859375, -15.4105224609375, -14.961669921875, -14.5128173828125, -14.06396484375, -13.6151123046875, -13.166259765625, -12.7174072265625, -12.2685546875, -11.8197021484375, -11.370849609375, -10.9219970703125, -10.47314453125, -10.0242919921875, -9.575439453125, -9.1265869140625, -8.677734375, -8.2288818359375, -7.780029296875, -7.3311767578125, -6.88232421875, -6.4334716796875, -5.984619140625, -5.5357666015625, -5.0869140625, -4.6380615234375, -4.189208984375, -3.7403564453125, -3.29150390625, -2.8426513671875, -2.393798828125, -1.9449462890625, -1.49609375, -1.0472412109375, -0.598388671875, -0.1495361328125, 0.29931640625, 0.7481689453125, 1.197021484375, 1.6458740234375, 2.0947265625, 2.5435791015625, 2.992431640625, 3.4412841796875, 3.89013671875, 4.3389892578125, 4.787841796875, 5.2366943359375, 5.685546875, 6.1343994140625, 6.583251953125, 7.0321044921875, 7.48095703125, 7.9298095703125, 8.378662109375, 8.8275146484375, 9.2763671875, 9.7252197265625, 10.174072265625, 10.6229248046875, 11.07177734375, 11.5206298828125, 11.969482421875, 12.4183349609375, 12.8671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 13.0, 13.0, 21.0, 23.0, 39.0, 41.0, 53.0, 88.0, 80.0, 83.0, 98.0, 86.0, 84.0, 81.0, 46.0, 54.0, 34.0, 25.0, 17.0, 10.0, 7.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.0440673828125, -11.455322265625, -10.8665771484375, -10.27783203125, -9.6890869140625, -9.100341796875, -8.5115966796875, -7.9228515625, -7.3341064453125, -6.745361328125, -6.1566162109375, -5.56787109375, -4.9791259765625, -4.390380859375, -3.8016357421875, -3.212890625, -2.6241455078125, -2.035400390625, -1.4466552734375, -0.85791015625, -0.2691650390625, 0.319580078125, 0.9083251953125, 1.4970703125, 2.0858154296875, 2.674560546875, 3.2633056640625, 3.85205078125, 4.4407958984375, 5.029541015625, 5.6182861328125, 6.20703125, 6.7957763671875, 7.384521484375, 7.9732666015625, 8.56201171875, 9.1507568359375, 9.739501953125, 10.3282470703125, 10.9169921875, 11.5057373046875, 12.094482421875, 12.6832275390625, 13.27197265625, 13.8607177734375, 14.449462890625, 15.0382080078125, 15.626953125, 16.2156982421875, 16.804443359375, 17.3931884765625, 17.98193359375, 18.5706787109375, 19.159423828125, 19.7481689453125, 20.3369140625, 20.9256591796875, 21.514404296875, 22.1031494140625, 22.69189453125, 23.2806396484375, 23.869384765625, 24.4581298828125, 25.046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 1.0, 9.0, 12.0, 14.0, 16.0, 26.0, 61.0, 85.0, 170.0, 269.0, 650.0, 1624.0, 6469.0, 64376.0, 818949.0, 141705.0, 10342.0, 2223.0, 768.0, 323.0, 179.0, 99.0, 72.0, 32.0, 24.0, 15.0, 8.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.35400390625, -6.1650390625, -5.97607421875, -5.787109375, -5.59814453125, -5.4091796875, -5.22021484375, -5.03125, -4.84228515625, -4.6533203125, -4.46435546875, -4.275390625, -4.08642578125, -3.8974609375, -3.70849609375, -3.51953125, -3.33056640625, -3.1416015625, -2.95263671875, -2.763671875, -2.57470703125, -2.3857421875, -2.19677734375, -2.0078125, -1.81884765625, -1.6298828125, -1.44091796875, -1.251953125, -1.06298828125, -0.8740234375, -0.68505859375, -0.49609375, -0.30712890625, -0.1181640625, 0.07080078125, 0.259765625, 0.44873046875, 0.6376953125, 0.82666015625, 1.015625, 1.20458984375, 1.3935546875, 1.58251953125, 1.771484375, 1.96044921875, 2.1494140625, 2.33837890625, 2.52734375, 2.71630859375, 2.9052734375, 3.09423828125, 3.283203125, 3.47216796875, 3.6611328125, 3.85009765625, 4.0390625, 4.22802734375, 4.4169921875, 4.60595703125, 4.794921875, 4.98388671875, 5.1728515625, 5.36181640625, 5.55078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 13.0, 13.0, 16.0, 26.0, 33.0, 45.0, 59.0, 73.0, 116.0, 118.0, 132.0, 90.0, 68.0, 51.0, 41.0, 28.0, 19.0, 8.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007238388061523438, -0.0007002800703048706, -0.0006767213344573975, -0.0006531625986099243, -0.0006296038627624512, -0.000606045126914978, -0.0005824863910675049, -0.0005589276552200317, -0.0005353689193725586, -0.0005118101835250854, -0.0004882514476776123, -0.00046469271183013916, -0.000441133975982666, -0.00041757524013519287, -0.0003940165042877197, -0.0003704577684402466, -0.00034689903259277344, -0.0003233402967453003, -0.00029978156089782715, -0.000276222825050354, -0.00025266408920288086, -0.00022910535335540771, -0.00020554661750793457, -0.00018198788166046143, -0.00015842914581298828, -0.00013487040996551514, -0.00011131167411804199, -8.775293827056885e-05, -6.41942024230957e-05, -4.063546657562256e-05, -1.7076730728149414e-05, 6.4820051193237305e-06, 3.0040740966796875e-05, 5.359947681427002e-05, 7.715821266174316e-05, 0.00010071694850921631, 0.00012427568435668945, 0.0001478344202041626, 0.00017139315605163574, 0.0001949518918991089, 0.00021851062774658203, 0.00024206936359405518, 0.0002656280994415283, 0.00028918683528900146, 0.0003127455711364746, 0.00033630430698394775, 0.0003598630428314209, 0.00038342177867889404, 0.0004069805145263672, 0.00043053925037384033, 0.0004540979862213135, 0.0004776567220687866, 0.0005012154579162598, 0.0005247741937637329, 0.0005483329296112061, 0.0005718916654586792, 0.0005954504013061523, 0.0006190091371536255, 0.0006425678730010986, 0.0006661266088485718, 0.0006896853446960449, 0.0007132440805435181, 0.0007368028163909912, 0.0007603615522384644, 0.0007839202880859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 8.0, 17.0, 21.0, 48.0, 101.0, 177.0, 375.0, 1117.0, 5715.0, 216145.0, 808309.0, 13808.0, 1723.0, 513.0, 223.0, 100.0, 65.0, 35.0, 16.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.750732421875, -7.45458984375, -7.158447265625, -6.8623046875, -6.566162109375, -6.27001953125, -5.973876953125, -5.677734375, -5.381591796875, -5.08544921875, -4.789306640625, -4.4931640625, -4.197021484375, -3.90087890625, -3.604736328125, -3.30859375, -3.012451171875, -2.71630859375, -2.420166015625, -2.1240234375, -1.827880859375, -1.53173828125, -1.235595703125, -0.939453125, -0.643310546875, -0.34716796875, -0.051025390625, 0.2451171875, 0.541259765625, 0.83740234375, 1.133544921875, 1.4296875, 1.725830078125, 2.02197265625, 2.318115234375, 2.6142578125, 2.910400390625, 3.20654296875, 3.502685546875, 3.798828125, 4.094970703125, 4.39111328125, 4.687255859375, 4.9833984375, 5.279541015625, 5.57568359375, 5.871826171875, 6.16796875, 6.464111328125, 6.76025390625, 7.056396484375, 7.3525390625, 7.648681640625, 7.94482421875, 8.240966796875, 8.537109375, 8.833251953125, 9.12939453125, 9.425537109375, 9.7216796875, 10.017822265625, 10.31396484375, 10.610107421875, 10.90625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 14.0, 14.0, 14.0, 27.0, 36.0, 46.0, 70.0, 107.0, 102.0, 109.0, 90.0, 109.0, 73.0, 54.0, 37.0, 27.0, 23.0, 7.0, 11.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.281097412109375, -3.13055419921875, -2.980010986328125, -2.8294677734375, -2.678924560546875, -2.52838134765625, -2.377838134765625, -2.227294921875, -2.076751708984375, -1.92620849609375, -1.775665283203125, -1.6251220703125, -1.474578857421875, -1.32403564453125, -1.173492431640625, -1.02294921875, -0.872406005859375, -0.72186279296875, -0.571319580078125, -0.4207763671875, -0.270233154296875, -0.11968994140625, 0.030853271484375, 0.181396484375, 0.331939697265625, 0.48248291015625, 0.633026123046875, 0.7835693359375, 0.934112548828125, 1.08465576171875, 1.235198974609375, 1.3857421875, 1.536285400390625, 1.68682861328125, 1.837371826171875, 1.9879150390625, 2.138458251953125, 2.28900146484375, 2.439544677734375, 2.590087890625, 2.740631103515625, 2.89117431640625, 3.041717529296875, 3.1922607421875, 3.342803955078125, 3.49334716796875, 3.643890380859375, 3.79443359375, 3.944976806640625, 4.09552001953125, 4.246063232421875, 4.3966064453125, 4.547149658203125, 4.69769287109375, 4.848236083984375, 4.998779296875, 5.149322509765625, 5.29986572265625, 5.450408935546875, 5.6009521484375, 5.751495361328125, 5.90203857421875, 6.052581787109375, 6.203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 10.0, 22.0, 29.0, 85.0, 146.0, 202.0, 223.0, 153.0, 70.0, 33.0, 20.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.145263671875, -86.52996826171875, -83.91468048095703, -81.29938507080078, -78.68409729003906, -76.06880187988281, -73.4535140991211, -70.83821868896484, -68.22293090820312, -65.60763549804688, -62.992347717285156, -60.37705612182617, -57.76176452636719, -55.14646911621094, -52.53117752075195, -49.91588592529297, -47.30059051513672, -44.685298919677734, -42.07000732421875, -39.454715728759766, -36.83942413330078, -34.22412872314453, -31.608837127685547, -28.993545532226562, -26.378253936767578, -23.762962341308594, -21.14767074584961, -18.532377243041992, -15.917085647583008, -13.301794052124023, -10.686501502990723, -8.071208953857422, -5.455909729003906, -2.8406176567077637, -0.2253255844116211, 2.3899664878845215, 5.005258560180664, 7.620550155639648, 10.23584270477295, 12.85113525390625, 15.466426849365234, 18.08171844482422, 20.697010040283203, 23.31230354309082, 25.927595138549805, 28.54288673400879, 31.158180236816406, 33.77347183227539, 36.388763427734375, 39.00405502319336, 41.619346618652344, 44.23463821411133, 46.84992980957031, 49.46522521972656, 52.08051681518555, 54.69580841064453, 57.311100006103516, 59.9263916015625, 62.541683197021484, 65.15697479248047, 67.77227020263672, 70.38755798339844, 73.00285339355469, 75.61814880371094, 78.23343658447266]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 11.0, 14.0, 15.0, 14.0, 22.0, 21.0, 26.0, 37.0, 32.0, 36.0, 34.0, 48.0, 42.0, 43.0, 50.0, 40.0, 59.0, 41.0, 44.0, 37.0, 45.0, 34.0, 21.0, 22.0, 32.0, 27.0, 28.0, 19.0, 9.0, 18.0, 16.0, 9.0, 4.0, 5.0, 8.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.62384033203125, -37.27640151977539, -35.9289665222168, -34.58152770996094, -33.234092712402344, -31.886653900146484, -30.539215087890625, -29.1917781829834, -27.844341278076172, -26.496904373168945, -25.14946746826172, -23.80202865600586, -22.454591751098633, -21.107154846191406, -19.759716033935547, -18.41227912902832, -17.064842224121094, -15.717405319213867, -14.369967460632324, -13.022529602050781, -11.675092697143555, -10.327655792236328, -8.980217933654785, -7.632780075073242, -6.285343170166016, -4.937905788421631, -3.590468406677246, -2.2430310249328613, -0.8955936431884766, 0.4518437385559082, 1.799281120300293, 3.146718978881836, 4.4941558837890625, 5.841593265533447, 7.189030647277832, 8.536468505859375, 9.883905410766602, 11.231342315673828, 12.578780174255371, 13.926218032836914, 15.27365493774414, 16.621091842651367, 17.968528747558594, 19.315967559814453, 20.66340446472168, 22.010841369628906, 23.358280181884766, 24.705717086791992, 26.05315399169922, 27.400590896606445, 28.748027801513672, 30.09546661376953, 31.442903518676758, 32.790340423583984, 34.137779235839844, 35.48521423339844, 36.8326530456543, 38.180091857910156, 39.52752685546875, 40.87496566772461, 42.22240447998047, 43.56983947753906, 44.91727828979492, 46.26471710205078, 47.612152099609375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 10.0, 6.0, 14.0, 26.0, 31.0, 48.0, 62.0, 106.0, 175.0, 276.0, 451.0, 798.0, 1371.0, 2582.0, 5880.0, 18738.0, 247592.0, 3877091.0, 25218.0, 7093.0, 2852.0, 1466.0, 962.0, 497.0, 347.0, 203.0, 123.0, 76.0, 48.0, 44.0, 35.0, 12.0, 6.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.9140625, -7.6595458984375, -7.405029296875, -7.1505126953125, -6.89599609375, -6.6414794921875, -6.386962890625, -6.1324462890625, -5.8779296875, -5.6234130859375, -5.368896484375, -5.1143798828125, -4.85986328125, -4.6053466796875, -4.350830078125, -4.0963134765625, -3.841796875, -3.5872802734375, -3.332763671875, -3.0782470703125, -2.82373046875, -2.5692138671875, -2.314697265625, -2.0601806640625, -1.8056640625, -1.5511474609375, -1.296630859375, -1.0421142578125, -0.78759765625, -0.5330810546875, -0.278564453125, -0.0240478515625, 0.23046875, 0.4849853515625, 0.739501953125, 0.9940185546875, 1.24853515625, 1.5030517578125, 1.757568359375, 2.0120849609375, 2.2666015625, 2.5211181640625, 2.775634765625, 3.0301513671875, 3.28466796875, 3.5391845703125, 3.793701171875, 4.0482177734375, 4.302734375, 4.5572509765625, 4.811767578125, 5.0662841796875, 5.32080078125, 5.5753173828125, 5.829833984375, 6.0843505859375, 6.3388671875, 6.5933837890625, 6.847900390625, 7.1024169921875, 7.35693359375, 7.6114501953125, 7.865966796875, 8.1204833984375, 8.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 2.0, 9.0, 8.0, 12.0, 9.0, 11.0, 25.0, 22.0, 39.0, 29.0, 37.0, 51.0, 48.0, 55.0, 61.0, 73.0, 69.0, 53.0, 49.0, 46.0, 48.0, 36.0, 34.0, 36.0, 29.0, 20.0, 14.0, 18.0, 13.0, 11.0, 11.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-2.794921875, -2.717864990234375, -2.64080810546875, -2.563751220703125, -2.4866943359375, -2.409637451171875, -2.33258056640625, -2.255523681640625, -2.178466796875, -2.101409912109375, -2.02435302734375, -1.947296142578125, -1.8702392578125, -1.793182373046875, -1.71612548828125, -1.639068603515625, -1.56201171875, -1.484954833984375, -1.40789794921875, -1.330841064453125, -1.2537841796875, -1.176727294921875, -1.09967041015625, -1.022613525390625, -0.945556640625, -0.868499755859375, -0.79144287109375, -0.714385986328125, -0.6373291015625, -0.560272216796875, -0.48321533203125, -0.406158447265625, -0.3291015625, -0.252044677734375, -0.17498779296875, -0.097930908203125, -0.0208740234375, 0.056182861328125, 0.13323974609375, 0.210296630859375, 0.287353515625, 0.364410400390625, 0.44146728515625, 0.518524169921875, 0.5955810546875, 0.672637939453125, 0.74969482421875, 0.826751708984375, 0.90380859375, 0.980865478515625, 1.05792236328125, 1.134979248046875, 1.2120361328125, 1.289093017578125, 1.36614990234375, 1.443206787109375, 1.520263671875, 1.597320556640625, 1.67437744140625, 1.751434326171875, 1.8284912109375, 1.905548095703125, 1.98260498046875, 2.059661865234375, 2.13671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 11.0, 11.0, 8.0, 12.0, 15.0, 16.0, 33.0, 32.0, 72.0, 96.0, 104.0, 177.0, 184.0, 335.0, 477.0, 756.0, 1117.0, 1823.0, 3445.0, 6553.0, 14948.0, 45695.0, 614503.0, 3418901.0, 52283.0, 16332.0, 7136.0, 3574.0, 2008.0, 1209.0, 757.0, 525.0, 344.0, 230.0, 150.0, 119.0, 92.0, 58.0, 41.0, 28.0, 22.0, 15.0, 7.0, 10.0, 9.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.36639404296875, -4.2210693359375, -4.07574462890625, -3.930419921875, -3.78509521484375, -3.6397705078125, -3.49444580078125, -3.34912109375, -3.20379638671875, -3.0584716796875, -2.91314697265625, -2.767822265625, -2.62249755859375, -2.4771728515625, -2.33184814453125, -2.1865234375, -2.04119873046875, -1.8958740234375, -1.75054931640625, -1.605224609375, -1.45989990234375, -1.3145751953125, -1.16925048828125, -1.02392578125, -0.87860107421875, -0.7332763671875, -0.58795166015625, -0.442626953125, -0.29730224609375, -0.1519775390625, -0.00665283203125, 0.138671875, 0.28399658203125, 0.4293212890625, 0.57464599609375, 0.719970703125, 0.86529541015625, 1.0106201171875, 1.15594482421875, 1.30126953125, 1.44659423828125, 1.5919189453125, 1.73724365234375, 1.882568359375, 2.02789306640625, 2.1732177734375, 2.31854248046875, 2.4638671875, 2.60919189453125, 2.7545166015625, 2.89984130859375, 3.045166015625, 3.19049072265625, 3.3358154296875, 3.48114013671875, 3.62646484375, 3.77178955078125, 3.9171142578125, 4.06243896484375, 4.207763671875, 4.35308837890625, 4.4984130859375, 4.64373779296875, 4.7890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 6.0, 12.0, 14.0, 29.0, 48.0, 90.0, 272.0, 3036.0, 254.0, 103.0, 57.0, 29.0, 16.0, 13.0, 12.0, 15.0, 8.0, 10.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.337890625, -1.3021621704101562, -1.2664337158203125, -1.2307052612304688, -1.194976806640625, -1.1592483520507812, -1.1235198974609375, -1.0877914428710938, -1.05206298828125, -1.0163345336914062, -0.9806060791015625, -0.9448776245117188, -0.909149169921875, -0.8734207153320312, -0.8376922607421875, -0.8019638061523438, -0.7662353515625, -0.7305068969726562, -0.6947784423828125, -0.6590499877929688, -0.623321533203125, -0.5875930786132812, -0.5518646240234375, -0.5161361694335938, -0.48040771484375, -0.44467926025390625, -0.4089508056640625, -0.37322235107421875, -0.337493896484375, -0.30176544189453125, -0.2660369873046875, -0.23030853271484375, -0.194580078125, -0.15885162353515625, -0.1231231689453125, -0.08739471435546875, -0.051666259765625, -0.01593780517578125, 0.0197906494140625, 0.05551910400390625, 0.09124755859375, 0.12697601318359375, 0.1627044677734375, 0.19843292236328125, 0.234161376953125, 0.26988983154296875, 0.3056182861328125, 0.34134674072265625, 0.3770751953125, 0.41280364990234375, 0.4485321044921875, 0.48426055908203125, 0.519989013671875, 0.5557174682617188, 0.5914459228515625, 0.6271743774414062, 0.66290283203125, 0.6986312866210938, 0.7343597412109375, 0.7700881958007812, 0.805816650390625, 0.8415451049804688, 0.8772735595703125, 0.9130020141601562, 0.94873046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 4.0, 12.0, 15.0, 15.0, 30.0, 62.0, 95.0, 109.0, 114.0, 130.0, 111.0, 95.0, 70.0, 49.0, 21.0, 21.0, 15.0, 4.0, 4.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.431550979614258, -5.236156940460205, -5.0407633781433105, -4.845369338989258, -4.649975776672363, -4.4545817375183105, -4.259187698364258, -4.063794136047363, -3.8684003353118896, -3.673006534576416, -3.4776127338409424, -3.2822189331054688, -3.086824893951416, -2.8914313316345215, -2.6960372924804688, -2.500643491744995, -2.3052496910095215, -2.109855890274048, -1.9144620895385742, -1.719068169593811, -1.5236743688583374, -1.3282805681228638, -1.1328866481781006, -0.937492847442627, -0.7420990467071533, -0.5467052459716797, -0.3513113856315613, -0.15591752529144287, 0.03947627544403076, 0.2348700761795044, 0.4302639961242676, 0.6256577968597412, 0.8210515975952148, 1.0164453983306885, 1.211839199066162, 1.4072331190109253, 1.602626919746399, 1.7980207204818726, 1.9934146404266357, 2.1888084411621094, 2.384202241897583, 2.5795960426330566, 2.7749898433685303, 2.970383644104004, 3.1657776832580566, 3.361171245574951, 3.556565284729004, 3.7519590854644775, 3.947352886199951, 4.142746925354004, 4.338140487670898, 4.533534526824951, 4.728928089141846, 4.924322128295898, 5.119715690612793, 5.315109729766846, 5.510503768920898, 5.705897808074951, 5.901291370391846, 6.096685409545898, 6.292078971862793, 6.487473011016846, 6.682867050170898, 6.878260612487793, 7.0736541748046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 10.0, 7.0, 11.0, 15.0, 16.0, 21.0, 20.0, 21.0, 28.0, 32.0, 29.0, 36.0, 35.0, 37.0, 30.0, 43.0, 41.0, 37.0, 33.0, 43.0, 41.0, 33.0, 41.0, 36.0, 47.0, 35.0, 24.0, 25.0, 30.0, 25.0, 11.0, 15.0, 12.0, 16.0, 9.0, 7.0, 8.0, 4.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.011662721633911, -2.924104928970337, -2.836547374725342, -2.7489895820617676, -2.6614320278167725, -2.5738742351531982, -2.486316680908203, -2.398758888244629, -2.311201333999634, -2.2236435413360596, -2.1360859870910645, -2.0485281944274902, -1.9609706401824951, -1.8734129667282104, -1.7858552932739258, -1.6982975006103516, -1.610739827156067, -1.5231821537017822, -1.4356244802474976, -1.348066806793213, -1.2605091333389282, -1.1729514598846436, -1.0853936672210693, -0.9978360533714294, -0.9102783799171448, -0.8227207064628601, -0.7351630330085754, -0.647605299949646, -0.5600476264953613, -0.47248998284339905, -0.384932279586792, -0.2973746061325073, -0.20981693267822266, -0.12225925177335739, -0.034701570868492126, 0.052856117486953735, 0.1404137909412384, 0.22797146439552307, 0.3155291676521301, 0.4030868411064148, 0.49064451456069946, 0.5782021880149841, 0.6657598614692688, 0.7533175945281982, 0.8408752679824829, 0.9284329414367676, 1.0159906148910522, 1.103548288345337, 1.1911059617996216, 1.2786636352539062, 1.366221308708191, 1.4537789821624756, 1.5413366556167603, 1.628894329071045, 1.7164521217346191, 1.8040096759796143, 1.8915674686431885, 1.9791251420974731, 2.066682815551758, 2.154240608215332, 2.241798162460327, 2.3293559551239014, 2.4169135093688965, 2.5044713020324707, 2.592028856277466]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 12.0, 17.0, 33.0, 60.0, 111.0, 225.0, 488.0, 1178.0, 3507.0, 11068.0, 39364.0, 148615.0, 443048.0, 289622.0, 80027.0, 21512.0, 6111.0, 2040.0, 821.0, 368.0, 152.0, 74.0, 43.0, 25.0, 11.0, 11.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.65985107421875, -4.5032958984375, -4.34674072265625, -4.190185546875, -4.03363037109375, -3.8770751953125, -3.72052001953125, -3.56396484375, -3.40740966796875, -3.2508544921875, -3.09429931640625, -2.937744140625, -2.78118896484375, -2.6246337890625, -2.46807861328125, -2.3115234375, -2.15496826171875, -1.9984130859375, -1.84185791015625, -1.685302734375, -1.52874755859375, -1.3721923828125, -1.21563720703125, -1.05908203125, -0.90252685546875, -0.7459716796875, -0.58941650390625, -0.432861328125, -0.27630615234375, -0.1197509765625, 0.03680419921875, 0.193359375, 0.34991455078125, 0.5064697265625, 0.66302490234375, 0.819580078125, 0.97613525390625, 1.1326904296875, 1.28924560546875, 1.44580078125, 1.60235595703125, 1.7589111328125, 1.91546630859375, 2.072021484375, 2.22857666015625, 2.3851318359375, 2.54168701171875, 2.6982421875, 2.85479736328125, 3.0113525390625, 3.16790771484375, 3.324462890625, 3.48101806640625, 3.6375732421875, 3.79412841796875, 3.95068359375, 4.10723876953125, 4.2637939453125, 4.42034912109375, 4.576904296875, 4.73345947265625, 4.8900146484375, 5.04656982421875, 5.203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 12.0, 15.0, 23.0, 22.0, 34.0, 28.0, 24.0, 59.0, 61.0, 58.0, 61.0, 76.0, 68.0, 55.0, 64.0, 58.0, 67.0, 40.0, 26.0, 29.0, 20.0, 20.0, 20.0, 12.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0], "bins": [-3.3828125, -3.296051025390625, -3.20928955078125, -3.122528076171875, -3.0357666015625, -2.949005126953125, -2.86224365234375, -2.775482177734375, -2.688720703125, -2.601959228515625, -2.51519775390625, -2.428436279296875, -2.3416748046875, -2.254913330078125, -2.16815185546875, -2.081390380859375, -1.99462890625, -1.907867431640625, -1.82110595703125, -1.734344482421875, -1.6475830078125, -1.560821533203125, -1.47406005859375, -1.387298583984375, -1.300537109375, -1.213775634765625, -1.12701416015625, -1.040252685546875, -0.9534912109375, -0.866729736328125, -0.77996826171875, -0.693206787109375, -0.6064453125, -0.519683837890625, -0.43292236328125, -0.346160888671875, -0.2593994140625, -0.172637939453125, -0.08587646484375, 0.000885009765625, 0.087646484375, 0.174407958984375, 0.26116943359375, 0.347930908203125, 0.4346923828125, 0.521453857421875, 0.60821533203125, 0.694976806640625, 0.78173828125, 0.868499755859375, 0.95526123046875, 1.042022705078125, 1.1287841796875, 1.215545654296875, 1.30230712890625, 1.389068603515625, 1.475830078125, 1.562591552734375, 1.64935302734375, 1.736114501953125, 1.8228759765625, 1.909637451171875, 1.99639892578125, 2.083160400390625, 2.169921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 10.0, 16.0, 32.0, 45.0, 81.0, 148.0, 225.0, 493.0, 1037.0, 3083.0, 54523.0, 954883.0, 29474.0, 2533.0, 973.0, 453.0, 227.0, 123.0, 69.0, 40.0, 22.0, 15.0, 16.0, 4.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -17.02197265625, -16.4970703125, -15.97216796875, -15.447265625, -14.92236328125, -14.3974609375, -13.87255859375, -13.34765625, -12.82275390625, -12.2978515625, -11.77294921875, -11.248046875, -10.72314453125, -10.1982421875, -9.67333984375, -9.1484375, -8.62353515625, -8.0986328125, -7.57373046875, -7.048828125, -6.52392578125, -5.9990234375, -5.47412109375, -4.94921875, -4.42431640625, -3.8994140625, -3.37451171875, -2.849609375, -2.32470703125, -1.7998046875, -1.27490234375, -0.75, -0.22509765625, 0.2998046875, 0.82470703125, 1.349609375, 1.87451171875, 2.3994140625, 2.92431640625, 3.44921875, 3.97412109375, 4.4990234375, 5.02392578125, 5.548828125, 6.07373046875, 6.5986328125, 7.12353515625, 7.6484375, 8.17333984375, 8.6982421875, 9.22314453125, 9.748046875, 10.27294921875, 10.7978515625, 11.32275390625, 11.84765625, 12.37255859375, 12.8974609375, 13.42236328125, 13.947265625, 14.47216796875, 14.9970703125, 15.52197265625, 16.046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 10.0, 9.0, 5.0, 13.0, 14.0, 17.0, 21.0, 38.0, 37.0, 45.0, 43.0, 64.0, 65.0, 61.0, 74.0, 59.0, 56.0, 78.0, 52.0, 53.0, 34.0, 33.0, 29.0, 21.0, 22.0, 10.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0234375, -13.5633544921875, -13.103271484375, -12.6431884765625, -12.18310546875, -11.7230224609375, -11.262939453125, -10.8028564453125, -10.3427734375, -9.8826904296875, -9.422607421875, -8.9625244140625, -8.50244140625, -8.0423583984375, -7.582275390625, -7.1221923828125, -6.662109375, -6.2020263671875, -5.741943359375, -5.2818603515625, -4.82177734375, -4.3616943359375, -3.901611328125, -3.4415283203125, -2.9814453125, -2.5213623046875, -2.061279296875, -1.6011962890625, -1.14111328125, -0.6810302734375, -0.220947265625, 0.2391357421875, 0.69921875, 1.1593017578125, 1.619384765625, 2.0794677734375, 2.53955078125, 2.9996337890625, 3.459716796875, 3.9197998046875, 4.3798828125, 4.8399658203125, 5.300048828125, 5.7601318359375, 6.22021484375, 6.6802978515625, 7.140380859375, 7.6004638671875, 8.060546875, 8.5206298828125, 8.980712890625, 9.4407958984375, 9.90087890625, 10.3609619140625, 10.821044921875, 11.2811279296875, 11.7412109375, 12.2012939453125, 12.661376953125, 13.1214599609375, 13.58154296875, 14.0416259765625, 14.501708984375, 14.9617919921875, 15.421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 12.0, 10.0, 10.0, 17.0, 21.0, 38.0, 60.0, 92.0, 180.0, 389.0, 1036.0, 5937.0, 301634.0, 727314.0, 9500.0, 1324.0, 468.0, 192.0, 107.0, 68.0, 43.0, 29.0, 22.0, 22.0, 4.0, 12.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.4080810546875, -8.128662109375, -7.8492431640625, -7.56982421875, -7.2904052734375, -7.010986328125, -6.7315673828125, -6.4521484375, -6.1727294921875, -5.893310546875, -5.6138916015625, -5.33447265625, -5.0550537109375, -4.775634765625, -4.4962158203125, -4.216796875, -3.9373779296875, -3.657958984375, -3.3785400390625, -3.09912109375, -2.8197021484375, -2.540283203125, -2.2608642578125, -1.9814453125, -1.7020263671875, -1.422607421875, -1.1431884765625, -0.86376953125, -0.5843505859375, -0.304931640625, -0.0255126953125, 0.25390625, 0.5333251953125, 0.812744140625, 1.0921630859375, 1.37158203125, 1.6510009765625, 1.930419921875, 2.2098388671875, 2.4892578125, 2.7686767578125, 3.048095703125, 3.3275146484375, 3.60693359375, 3.8863525390625, 4.165771484375, 4.4451904296875, 4.724609375, 5.0040283203125, 5.283447265625, 5.5628662109375, 5.84228515625, 6.1217041015625, 6.401123046875, 6.6805419921875, 6.9599609375, 7.2393798828125, 7.518798828125, 7.7982177734375, 8.07763671875, 8.3570556640625, 8.636474609375, 8.9158935546875, 9.1953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 7.0, 5.0, 4.0, 7.0, 7.0, 10.0, 9.0, 18.0, 27.0, 27.0, 34.0, 49.0, 60.0, 73.0, 74.0, 89.0, 99.0, 80.0, 70.0, 49.0, 44.0, 21.0, 35.0, 14.0, 15.0, 11.0, 12.0, 14.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005006790161132812, -0.00048555806279182434, -0.00047043710947036743, -0.0004553161561489105, -0.0004401952028274536, -0.0004250742495059967, -0.0004099532961845398, -0.0003948323428630829, -0.000379711389541626, -0.00036459043622016907, -0.00034946948289871216, -0.00033434852957725525, -0.00031922757625579834, -0.00030410662293434143, -0.0002889856696128845, -0.0002738647162914276, -0.0002587437629699707, -0.0002436228096485138, -0.00022850185632705688, -0.00021338090300559998, -0.00019825994968414307, -0.00018313899636268616, -0.00016801804304122925, -0.00015289708971977234, -0.00013777613639831543, -0.00012265518307685852, -0.00010753422975540161, -9.24132764339447e-05, -7.729232311248779e-05, -6.217136979103088e-05, -4.7050416469573975e-05, -3.1929463148117065e-05, -1.6808509826660156e-05, -1.687556505203247e-06, 1.3433396816253662e-05, 2.855435013771057e-05, 4.367530345916748e-05, 5.879625678062439e-05, 7.39172101020813e-05, 8.903816342353821e-05, 0.00010415911674499512, 0.00011928007006645203, 0.00013440102338790894, 0.00014952197670936584, 0.00016464293003082275, 0.00017976388335227966, 0.00019488483667373657, 0.00021000578999519348, 0.0002251267433166504, 0.0002402476966381073, 0.0002553686499595642, 0.0002704896032810211, 0.00028561055660247803, 0.00030073150992393494, 0.00031585246324539185, 0.00033097341656684875, 0.00034609436988830566, 0.0003612153232097626, 0.0003763362765312195, 0.0003914572298526764, 0.0004065781831741333, 0.0004216991364955902, 0.0004368200898170471, 0.00045194104313850403, 0.00046706199645996094]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 7.0, 7.0, 9.0, 17.0, 14.0, 25.0, 45.0, 53.0, 104.0, 162.0, 309.0, 586.0, 1238.0, 3545.0, 17374.0, 294132.0, 686481.0, 35786.0, 5338.0, 1693.0, 712.0, 378.0, 193.0, 106.0, 71.0, 39.0, 31.0, 19.0, 18.0, 16.0, 11.0, 4.0, 10.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.09283447265625, -4.9239501953125, -4.75506591796875, -4.586181640625, -4.41729736328125, -4.2484130859375, -4.07952880859375, -3.91064453125, -3.74176025390625, -3.5728759765625, -3.40399169921875, -3.235107421875, -3.06622314453125, -2.8973388671875, -2.72845458984375, -2.5595703125, -2.39068603515625, -2.2218017578125, -2.05291748046875, -1.884033203125, -1.71514892578125, -1.5462646484375, -1.37738037109375, -1.20849609375, -1.03961181640625, -0.8707275390625, -0.70184326171875, -0.532958984375, -0.36407470703125, -0.1951904296875, -0.02630615234375, 0.142578125, 0.31146240234375, 0.4803466796875, 0.64923095703125, 0.818115234375, 0.98699951171875, 1.1558837890625, 1.32476806640625, 1.49365234375, 1.66253662109375, 1.8314208984375, 2.00030517578125, 2.169189453125, 2.33807373046875, 2.5069580078125, 2.67584228515625, 2.8447265625, 3.01361083984375, 3.1824951171875, 3.35137939453125, 3.520263671875, 3.68914794921875, 3.8580322265625, 4.02691650390625, 4.19580078125, 4.36468505859375, 4.5335693359375, 4.70245361328125, 4.871337890625, 5.04022216796875, 5.2091064453125, 5.37799072265625, 5.546875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 13.0, 12.0, 28.0, 37.0, 48.0, 73.0, 91.0, 124.0, 125.0, 111.0, 86.0, 64.0, 54.0, 27.0, 28.0, 9.0, 18.0, 12.0, 8.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.78094482421875, -4.6243896484375, -4.46783447265625, -4.311279296875, -4.15472412109375, -3.9981689453125, -3.84161376953125, -3.68505859375, -3.52850341796875, -3.3719482421875, -3.21539306640625, -3.058837890625, -2.90228271484375, -2.7457275390625, -2.58917236328125, -2.4326171875, -2.27606201171875, -2.1195068359375, -1.96295166015625, -1.806396484375, -1.64984130859375, -1.4932861328125, -1.33673095703125, -1.18017578125, -1.02362060546875, -0.8670654296875, -0.71051025390625, -0.553955078125, -0.39739990234375, -0.2408447265625, -0.08428955078125, 0.072265625, 0.22882080078125, 0.3853759765625, 0.54193115234375, 0.698486328125, 0.85504150390625, 1.0115966796875, 1.16815185546875, 1.32470703125, 1.48126220703125, 1.6378173828125, 1.79437255859375, 1.950927734375, 2.10748291015625, 2.2640380859375, 2.42059326171875, 2.5771484375, 2.73370361328125, 2.8902587890625, 3.04681396484375, 3.203369140625, 3.35992431640625, 3.5164794921875, 3.67303466796875, 3.82958984375, 3.98614501953125, 4.1427001953125, 4.29925537109375, 4.455810546875, 4.61236572265625, 4.7689208984375, 4.92547607421875, 5.08203125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 8.0, 43.0, 290.0, 541.0, 104.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.3489990234375, -149.616943359375, -142.88487243652344, -136.15281677246094, -129.42076110839844, -122.6886978149414, -115.95663452148438, -109.22457885742188, -102.49252319335938, -95.76045989990234, -89.02840423583984, -82.29634094238281, -75.56428527832031, -68.83222198486328, -62.100162506103516, -55.36810302734375, -48.63603973388672, -41.90398025512695, -35.17192077636719, -28.43985939025879, -21.707799911499023, -14.975738525390625, -8.24367904663086, -1.5116195678710938, 5.220439910888672, 11.952499389648438, 18.684558868408203, 25.4166202545166, 32.148681640625, 38.880741119384766, 45.61280059814453, 52.3448600769043, 59.07691955566406, 65.8089828491211, 72.5410385131836, 79.27310180664062, 86.00515747070312, 92.73722076416016, 99.46928405761719, 106.20133972167969, 112.93339538574219, 119.66545867919922, 126.39751434326172, 133.12957763671875, 139.86163330078125, 146.59368896484375, 153.3257598876953, 160.0578155517578, 166.78988647460938, 173.52194213867188, 180.25401306152344, 186.98606872558594, 193.71812438964844, 200.4501953125, 207.1822509765625, 213.914306640625, 220.6463623046875, 227.37841796875, 234.11048889160156, 240.84254455566406, 247.57460021972656, 254.30667114257812, 261.0387268066406, 267.7707824707031, 274.5028381347656]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 10.0, 7.0, 4.0, 7.0, 13.0, 9.0, 18.0, 18.0, 24.0, 18.0, 22.0, 35.0, 37.0, 38.0, 36.0, 45.0, 42.0, 37.0, 51.0, 59.0, 42.0, 49.0, 46.0, 45.0, 41.0, 31.0, 17.0, 30.0, 29.0, 20.0, 20.0, 15.0, 13.0, 16.0, 10.0, 7.0, 11.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.7602653503418, -37.44147872924805, -36.12268829345703, -34.80390167236328, -33.48511505126953, -32.16632843017578, -30.8475399017334, -29.528751373291016, -28.209964752197266, -26.891178131103516, -25.572389602661133, -24.25360107421875, -22.934814453125, -21.61602783203125, -20.297239303588867, -18.978450775146484, -17.659664154052734, -16.340877532958984, -15.022089004516602, -13.703301429748535, -12.384513854980469, -11.065726280212402, -9.746938705444336, -8.42815113067627, -7.109363555908203, -5.790575981140137, -4.47178840637207, -3.153000831604004, -1.8342132568359375, -0.5154256820678711, 0.8033618927001953, 2.1221494674682617, 3.4409332275390625, 4.759720802307129, 6.078508377075195, 7.397295951843262, 8.716083526611328, 10.034871101379395, 11.353658676147461, 12.672446250915527, 13.991233825683594, 15.31002140045166, 16.628808975219727, 17.94759750366211, 19.26638412475586, 20.58517074584961, 21.903959274291992, 23.222747802734375, 24.541534423828125, 25.860321044921875, 27.179109573364258, 28.49789810180664, 29.81668472290039, 31.13547134399414, 32.454261779785156, 33.773048400878906, 35.091835021972656, 36.410621643066406, 37.729408264160156, 39.04819869995117, 40.36698532104492, 41.68577194213867, 43.00456237792969, 44.32334899902344, 45.64213562011719]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 11.0, 9.0, 7.0, 14.0, 15.0, 27.0, 49.0, 64.0, 94.0, 156.0, 246.0, 431.0, 694.0, 1219.0, 2318.0, 4738.0, 11336.0, 37686.0, 372872.0, 3669321.0, 63896.0, 16180.0, 6224.0, 2831.0, 1588.0, 825.0, 533.0, 317.0, 189.0, 102.0, 89.0, 59.0, 36.0, 33.0, 17.0, 17.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.0777587890625, -4.909423828125, -4.7410888671875, -4.57275390625, -4.4044189453125, -4.236083984375, -4.0677490234375, -3.8994140625, -3.7310791015625, -3.562744140625, -3.3944091796875, -3.22607421875, -3.0577392578125, -2.889404296875, -2.7210693359375, -2.552734375, -2.3843994140625, -2.216064453125, -2.0477294921875, -1.87939453125, -1.7110595703125, -1.542724609375, -1.3743896484375, -1.2060546875, -1.0377197265625, -0.869384765625, -0.7010498046875, -0.53271484375, -0.3643798828125, -0.196044921875, -0.0277099609375, 0.140625, 0.3089599609375, 0.477294921875, 0.6456298828125, 0.81396484375, 0.9822998046875, 1.150634765625, 1.3189697265625, 1.4873046875, 1.6556396484375, 1.823974609375, 1.9923095703125, 2.16064453125, 2.3289794921875, 2.497314453125, 2.6656494140625, 2.833984375, 3.0023193359375, 3.170654296875, 3.3389892578125, 3.50732421875, 3.6756591796875, 3.843994140625, 4.0123291015625, 4.1806640625, 4.3489990234375, 4.517333984375, 4.6856689453125, 4.85400390625, 5.0223388671875, 5.190673828125, 5.3590087890625, 5.52734375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 11.0, 7.0, 13.0, 15.0, 19.0, 17.0, 26.0, 37.0, 38.0, 37.0, 43.0, 47.0, 41.0, 57.0, 57.0, 66.0, 40.0, 49.0, 40.0, 43.0, 44.0, 37.0, 31.0, 29.0, 32.0, 15.0, 17.0, 20.0, 10.0, 12.0, 7.0, 7.0, 6.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.8128662109375, -1.746826171875, -1.6807861328125, -1.61474609375, -1.5487060546875, -1.482666015625, -1.4166259765625, -1.3505859375, -1.2845458984375, -1.218505859375, -1.1524658203125, -1.08642578125, -1.0203857421875, -0.954345703125, -0.8883056640625, -0.822265625, -0.7562255859375, -0.690185546875, -0.6241455078125, -0.55810546875, -0.4920654296875, -0.426025390625, -0.3599853515625, -0.2939453125, -0.2279052734375, -0.161865234375, -0.0958251953125, -0.02978515625, 0.0362548828125, 0.102294921875, 0.1683349609375, 0.234375, 0.3004150390625, 0.366455078125, 0.4324951171875, 0.49853515625, 0.5645751953125, 0.630615234375, 0.6966552734375, 0.7626953125, 0.8287353515625, 0.894775390625, 0.9608154296875, 1.02685546875, 1.0928955078125, 1.158935546875, 1.2249755859375, 1.291015625, 1.3570556640625, 1.423095703125, 1.4891357421875, 1.55517578125, 1.6212158203125, 1.687255859375, 1.7532958984375, 1.8193359375, 1.8853759765625, 1.951416015625, 2.0174560546875, 2.08349609375, 2.1495361328125, 2.215576171875, 2.2816162109375, 2.34765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 12.0, 22.0, 15.0, 34.0, 32.0, 56.0, 64.0, 100.0, 131.0, 241.0, 362.0, 636.0, 1211.0, 2452.0, 5625.0, 15239.0, 58781.0, 1165166.0, 2851739.0, 64731.0, 16257.0, 5820.0, 2469.0, 1245.0, 678.0, 386.0, 245.0, 144.0, 109.0, 68.0, 58.0, 41.0, 37.0, 21.0, 12.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.6199951171875, -5.454833984375, -5.2896728515625, -5.12451171875, -4.9593505859375, -4.794189453125, -4.6290283203125, -4.4638671875, -4.2987060546875, -4.133544921875, -3.9683837890625, -3.80322265625, -3.6380615234375, -3.472900390625, -3.3077392578125, -3.142578125, -2.9774169921875, -2.812255859375, -2.6470947265625, -2.48193359375, -2.3167724609375, -2.151611328125, -1.9864501953125, -1.8212890625, -1.6561279296875, -1.490966796875, -1.3258056640625, -1.16064453125, -0.9954833984375, -0.830322265625, -0.6651611328125, -0.5, -0.3348388671875, -0.169677734375, -0.0045166015625, 0.16064453125, 0.3258056640625, 0.490966796875, 0.6561279296875, 0.8212890625, 0.9864501953125, 1.151611328125, 1.3167724609375, 1.48193359375, 1.6470947265625, 1.812255859375, 1.9774169921875, 2.142578125, 2.3077392578125, 2.472900390625, 2.6380615234375, 2.80322265625, 2.9683837890625, 3.133544921875, 3.2987060546875, 3.4638671875, 3.6290283203125, 3.794189453125, 3.9593505859375, 4.12451171875, 4.2896728515625, 4.454833984375, 4.6199951171875, 4.78515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 12.0, 17.0, 13.0, 24.0, 40.0, 53.0, 100.0, 235.0, 1924.0, 1179.0, 204.0, 98.0, 49.0, 41.0, 19.0, 13.0, 11.0, 9.0, 7.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.943634033203125, -1.86578369140625, -1.787933349609375, -1.7100830078125, -1.632232666015625, -1.55438232421875, -1.476531982421875, -1.398681640625, -1.320831298828125, -1.24298095703125, -1.165130615234375, -1.0872802734375, -1.009429931640625, -0.93157958984375, -0.853729248046875, -0.77587890625, -0.698028564453125, -0.62017822265625, -0.542327880859375, -0.4644775390625, -0.386627197265625, -0.30877685546875, -0.230926513671875, -0.153076171875, -0.075225830078125, 0.00262451171875, 0.080474853515625, 0.1583251953125, 0.236175537109375, 0.31402587890625, 0.391876220703125, 0.4697265625, 0.547576904296875, 0.62542724609375, 0.703277587890625, 0.7811279296875, 0.858978271484375, 0.93682861328125, 1.014678955078125, 1.092529296875, 1.170379638671875, 1.24822998046875, 1.326080322265625, 1.4039306640625, 1.481781005859375, 1.55963134765625, 1.637481689453125, 1.71533203125, 1.793182373046875, 1.87103271484375, 1.948883056640625, 2.0267333984375, 2.104583740234375, 2.18243408203125, 2.260284423828125, 2.338134765625, 2.415985107421875, 2.49383544921875, 2.571685791015625, 2.6495361328125, 2.727386474609375, 2.80523681640625, 2.883087158203125, 2.9609375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 15.0, 26.0, 59.0, 80.0, 106.0, 153.0, 146.0, 120.0, 93.0, 71.0, 52.0, 35.0, 12.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.10651969909668, -16.661672592163086, -16.216827392578125, -15.771980285644531, -15.327133178710938, -14.88228702545166, -14.437440872192383, -13.992593765258789, -13.547746658325195, -13.102900505065918, -12.658053398132324, -12.213207244873047, -11.768360137939453, -11.323513984680176, -10.878667831420898, -10.433820724487305, -9.988974571228027, -9.54412841796875, -9.099281311035156, -8.654435157775879, -8.209588050842285, -7.764741897583008, -7.319895267486572, -6.875048637390137, -6.430202007293701, -5.985355377197266, -5.54050874710083, -5.0956621170043945, -4.650815963745117, -4.205968856811523, -3.761122703552246, -3.3162760734558105, -2.8714303970336914, -2.426583766937256, -1.9817372560501099, -1.5368907451629639, -1.0920441150665283, -0.6471974849700928, -0.20235109329223633, 0.24249553680419922, 0.6873421669006348, 1.1321887969970703, 1.5770353078842163, 2.0218818187713623, 2.466728448867798, 2.9115750789642334, 3.35642147064209, 3.8012681007385254, 4.246114730834961, 4.6909613609313965, 5.135807991027832, 5.580654144287109, 6.025501251220703, 6.4703474044799805, 6.915194034576416, 7.360040664672852, 7.804887294769287, 8.249733924865723, 8.694580078125, 9.139427185058594, 9.584273338317871, 10.029120445251465, 10.473966598510742, 10.918813705444336, 11.363659858703613]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 7.0, 6.0, 7.0, 7.0, 13.0, 15.0, 20.0, 21.0, 15.0, 27.0, 23.0, 30.0, 31.0, 24.0, 34.0, 46.0, 45.0, 49.0, 40.0, 37.0, 60.0, 36.0, 35.0, 39.0, 35.0, 51.0, 33.0, 25.0, 22.0, 26.0, 22.0, 18.0, 9.0, 17.0, 7.0, 7.0, 14.0, 6.0, 3.0, 9.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.914201736450195, -5.727599143981934, -5.540996074676514, -5.354393482208252, -5.167790412902832, -4.98118782043457, -4.794585227966309, -4.607982158660889, -4.421379566192627, -4.234776973724365, -4.048173904418945, -3.8615713119506836, -3.6749684810638428, -3.488365650177002, -3.301762819290161, -3.1151599884033203, -2.9285571575164795, -2.7419543266296387, -2.555351495742798, -2.368748664855957, -2.1821460723876953, -1.9955432415008545, -1.8089404106140137, -1.6223376989364624, -1.4357348680496216, -1.2491320371627808, -1.0625293254852295, -0.8759264945983887, -0.6893237233161926, -0.5027209520339966, -0.31611812114715576, -0.1295154094696045, 0.05708742141723633, 0.24369020760059357, 0.4302929937839508, 0.6168957948684692, 0.8034985661506653, 0.9901013374328613, 1.1767041683197021, 1.3633068799972534, 1.5499097108840942, 1.736512541770935, 1.9231152534484863, 2.109718084335327, 2.296320915222168, 2.4829235076904297, 2.6695265769958496, 2.8561291694641113, 3.042732000350952, 3.229334831237793, 3.415937662124634, 3.6025404930114746, 3.7891430854797363, 3.975745916366577, 4.162348747253418, 4.34895133972168, 4.5355544090271, 4.722157001495361, 4.908760070800781, 5.095362663269043, 5.281965732574463, 5.468568325042725, 5.6551713943481445, 5.841773986816406, 6.028376579284668]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 9.0, 8.0, 15.0, 36.0, 67.0, 115.0, 251.0, 566.0, 1425.0, 4183.0, 14149.0, 54750.0, 225226.0, 540587.0, 153565.0, 38338.0, 10226.0, 3095.0, 1104.0, 448.0, 207.0, 79.0, 43.0, 24.0, 13.0, 12.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0546875, -5.8250732421875, -5.595458984375, -5.3658447265625, -5.13623046875, -4.9066162109375, -4.677001953125, -4.4473876953125, -4.2177734375, -3.9881591796875, -3.758544921875, -3.5289306640625, -3.29931640625, -3.0697021484375, -2.840087890625, -2.6104736328125, -2.380859375, -2.1512451171875, -1.921630859375, -1.6920166015625, -1.46240234375, -1.2327880859375, -1.003173828125, -0.7735595703125, -0.5439453125, -0.3143310546875, -0.084716796875, 0.1448974609375, 0.37451171875, 0.6041259765625, 0.833740234375, 1.0633544921875, 1.29296875, 1.5225830078125, 1.752197265625, 1.9818115234375, 2.21142578125, 2.4410400390625, 2.670654296875, 2.9002685546875, 3.1298828125, 3.3594970703125, 3.589111328125, 3.8187255859375, 4.04833984375, 4.2779541015625, 4.507568359375, 4.7371826171875, 4.966796875, 5.1964111328125, 5.426025390625, 5.6556396484375, 5.88525390625, 6.1148681640625, 6.344482421875, 6.5740966796875, 6.8037109375, 7.0333251953125, 7.262939453125, 7.4925537109375, 7.72216796875, 7.9517822265625, 8.181396484375, 8.4110107421875, 8.640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 10.0, 10.0, 10.0, 15.0, 12.0, 13.0, 23.0, 29.0, 39.0, 44.0, 39.0, 39.0, 66.0, 50.0, 53.0, 43.0, 55.0, 64.0, 41.0, 60.0, 45.0, 35.0, 28.0, 26.0, 21.0, 20.0, 32.0, 11.0, 12.0, 10.0, 12.0, 3.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.3984375, -2.327178955078125, -2.25592041015625, -2.184661865234375, -2.1134033203125, -2.042144775390625, -1.97088623046875, -1.899627685546875, -1.828369140625, -1.757110595703125, -1.68585205078125, -1.614593505859375, -1.5433349609375, -1.472076416015625, -1.40081787109375, -1.329559326171875, -1.25830078125, -1.187042236328125, -1.11578369140625, -1.044525146484375, -0.9732666015625, -0.902008056640625, -0.83074951171875, -0.759490966796875, -0.688232421875, -0.616973876953125, -0.54571533203125, -0.474456787109375, -0.4031982421875, -0.331939697265625, -0.26068115234375, -0.189422607421875, -0.1181640625, -0.046905517578125, 0.02435302734375, 0.095611572265625, 0.1668701171875, 0.238128662109375, 0.30938720703125, 0.380645751953125, 0.451904296875, 0.523162841796875, 0.59442138671875, 0.665679931640625, 0.7369384765625, 0.808197021484375, 0.87945556640625, 0.950714111328125, 1.02197265625, 1.093231201171875, 1.16448974609375, 1.235748291015625, 1.3070068359375, 1.378265380859375, 1.44952392578125, 1.520782470703125, 1.592041015625, 1.663299560546875, 1.73455810546875, 1.805816650390625, 1.8770751953125, 1.948333740234375, 2.01959228515625, 2.090850830078125, 2.162109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 5.0, 7.0, 9.0, 8.0, 10.0, 20.0, 18.0, 27.0, 44.0, 46.0, 54.0, 87.0, 128.0, 185.0, 293.0, 545.0, 988.0, 2039.0, 6260.0, 50315.0, 788764.0, 179243.0, 13246.0, 3093.0, 1251.0, 643.0, 397.0, 228.0, 160.0, 102.0, 74.0, 52.0, 38.0, 25.0, 40.0, 26.0, 14.0, 20.0, 10.0, 10.0, 3.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-12.375, -11.9847412109375, -11.594482421875, -11.2042236328125, -10.81396484375, -10.4237060546875, -10.033447265625, -9.6431884765625, -9.2529296875, -8.8626708984375, -8.472412109375, -8.0821533203125, -7.69189453125, -7.3016357421875, -6.911376953125, -6.5211181640625, -6.130859375, -5.7406005859375, -5.350341796875, -4.9600830078125, -4.56982421875, -4.1795654296875, -3.789306640625, -3.3990478515625, -3.0087890625, -2.6185302734375, -2.228271484375, -1.8380126953125, -1.44775390625, -1.0574951171875, -0.667236328125, -0.2769775390625, 0.11328125, 0.5035400390625, 0.893798828125, 1.2840576171875, 1.67431640625, 2.0645751953125, 2.454833984375, 2.8450927734375, 3.2353515625, 3.6256103515625, 4.015869140625, 4.4061279296875, 4.79638671875, 5.1866455078125, 5.576904296875, 5.9671630859375, 6.357421875, 6.7476806640625, 7.137939453125, 7.5281982421875, 7.91845703125, 8.3087158203125, 8.698974609375, 9.0892333984375, 9.4794921875, 9.8697509765625, 10.260009765625, 10.6502685546875, 11.04052734375, 11.4307861328125, 11.821044921875, 12.2113037109375, 12.6015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 9.0, 9.0, 16.0, 23.0, 21.0, 39.0, 49.0, 55.0, 54.0, 68.0, 63.0, 82.0, 78.0, 57.0, 71.0, 69.0, 54.0, 46.0, 38.0, 16.0, 20.0, 22.0, 11.0, 9.0, 8.0, 5.0, 7.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.53125, -14.064697265625, -13.59814453125, -13.131591796875, -12.6650390625, -12.198486328125, -11.73193359375, -11.265380859375, -10.798828125, -10.332275390625, -9.86572265625, -9.399169921875, -8.9326171875, -8.466064453125, -7.99951171875, -7.532958984375, -7.06640625, -6.599853515625, -6.13330078125, -5.666748046875, -5.2001953125, -4.733642578125, -4.26708984375, -3.800537109375, -3.333984375, -2.867431640625, -2.40087890625, -1.934326171875, -1.4677734375, -1.001220703125, -0.53466796875, -0.068115234375, 0.3984375, 0.864990234375, 1.33154296875, 1.798095703125, 2.2646484375, 2.731201171875, 3.19775390625, 3.664306640625, 4.130859375, 4.597412109375, 5.06396484375, 5.530517578125, 5.9970703125, 6.463623046875, 6.93017578125, 7.396728515625, 7.86328125, 8.329833984375, 8.79638671875, 9.262939453125, 9.7294921875, 10.196044921875, 10.66259765625, 11.129150390625, 11.595703125, 12.062255859375, 12.52880859375, 12.995361328125, 13.4619140625, 13.928466796875, 14.39501953125, 14.861572265625, 15.328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 17.0, 26.0, 33.0, 49.0, 64.0, 102.0, 171.0, 309.0, 580.0, 1160.0, 3123.0, 9663.0, 40743.0, 278304.0, 613112.0, 77547.0, 15494.0, 4568.0, 1700.0, 772.0, 396.0, 205.0, 121.0, 81.0, 62.0, 37.0, 28.0, 14.0, 8.0, 8.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.908203125, -3.797119140625, -3.68603515625, -3.574951171875, -3.4638671875, -3.352783203125, -3.24169921875, -3.130615234375, -3.01953125, -2.908447265625, -2.79736328125, -2.686279296875, -2.5751953125, -2.464111328125, -2.35302734375, -2.241943359375, -2.130859375, -2.019775390625, -1.90869140625, -1.797607421875, -1.6865234375, -1.575439453125, -1.46435546875, -1.353271484375, -1.2421875, -1.131103515625, -1.02001953125, -0.908935546875, -0.7978515625, -0.686767578125, -0.57568359375, -0.464599609375, -0.353515625, -0.242431640625, -0.13134765625, -0.020263671875, 0.0908203125, 0.201904296875, 0.31298828125, 0.424072265625, 0.53515625, 0.646240234375, 0.75732421875, 0.868408203125, 0.9794921875, 1.090576171875, 1.20166015625, 1.312744140625, 1.423828125, 1.534912109375, 1.64599609375, 1.757080078125, 1.8681640625, 1.979248046875, 2.09033203125, 2.201416015625, 2.3125, 2.423583984375, 2.53466796875, 2.645751953125, 2.7568359375, 2.867919921875, 2.97900390625, 3.090087890625, 3.201171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 10.0, 7.0, 11.0, 16.0, 31.0, 31.0, 35.0, 53.0, 56.0, 59.0, 134.0, 194.0, 100.0, 44.0, 45.0, 47.0, 30.0, 23.0, 25.0, 16.0, 14.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008940696716308594, -0.0008623376488685608, -0.0008306056261062622, -0.0007988736033439636, -0.000767141580581665, -0.0007354095578193665, -0.0007036775350570679, -0.0006719455122947693, -0.0006402134895324707, -0.0006084814667701721, -0.0005767494440078735, -0.000545017421245575, -0.0005132853984832764, -0.0004815533757209778, -0.0004498213529586792, -0.0004180893301963806, -0.00038635730743408203, -0.00035462528467178345, -0.00032289326190948486, -0.0002911612391471863, -0.0002594292163848877, -0.0002276971936225891, -0.00019596517086029053, -0.00016423314809799194, -0.00013250112533569336, -0.00010076910257339478, -6.903707981109619e-05, -3.730505704879761e-05, -5.5730342864990234e-06, 2.615898847579956e-05, 5.7891011238098145e-05, 8.962303400039673e-05, 0.00012135505676269531, 0.0001530870795249939, 0.00018481910228729248, 0.00021655112504959106, 0.00024828314781188965, 0.00028001517057418823, 0.0003117471933364868, 0.0003434792160987854, 0.000375211238861084, 0.00040694326162338257, 0.00043867528438568115, 0.00047040730714797974, 0.0005021393299102783, 0.0005338713526725769, 0.0005656033754348755, 0.0005973353981971741, 0.0006290674209594727, 0.0006607994437217712, 0.0006925314664840698, 0.0007242634892463684, 0.000755995512008667, 0.0007877275347709656, 0.0008194595575332642, 0.0008511915802955627, 0.0008829236030578613, 0.0009146556258201599, 0.0009463876485824585, 0.000978119671344757, 0.0010098516941070557, 0.0010415837168693542, 0.0010733157396316528, 0.0011050477623939514, 0.00113677978515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 11.0, 13.0, 20.0, 29.0, 58.0, 94.0, 184.0, 366.0, 765.0, 2126.0, 8569.0, 90460.0, 837881.0, 95623.0, 8687.0, 2121.0, 773.0, 361.0, 170.0, 82.0, 58.0, 33.0, 10.0, 18.0, 7.0, 10.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.85546875, -5.68072509765625, -5.5059814453125, -5.33123779296875, -5.156494140625, -4.98175048828125, -4.8070068359375, -4.63226318359375, -4.45751953125, -4.28277587890625, -4.1080322265625, -3.93328857421875, -3.758544921875, -3.58380126953125, -3.4090576171875, -3.23431396484375, -3.0595703125, -2.88482666015625, -2.7100830078125, -2.53533935546875, -2.360595703125, -2.18585205078125, -2.0111083984375, -1.83636474609375, -1.66162109375, -1.48687744140625, -1.3121337890625, -1.13739013671875, -0.962646484375, -0.78790283203125, -0.6131591796875, -0.43841552734375, -0.263671875, -0.08892822265625, 0.0858154296875, 0.26055908203125, 0.435302734375, 0.61004638671875, 0.7847900390625, 0.95953369140625, 1.13427734375, 1.30902099609375, 1.4837646484375, 1.65850830078125, 1.833251953125, 2.00799560546875, 2.1827392578125, 2.35748291015625, 2.5322265625, 2.70697021484375, 2.8817138671875, 3.05645751953125, 3.231201171875, 3.40594482421875, 3.5806884765625, 3.75543212890625, 3.93017578125, 4.10491943359375, 4.2796630859375, 4.45440673828125, 4.629150390625, 4.80389404296875, 4.9786376953125, 5.15338134765625, 5.328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 8.0, 11.0, 10.0, 9.0, 21.0, 26.0, 34.0, 35.0, 64.0, 82.0, 104.0, 102.0, 104.0, 94.0, 56.0, 54.0, 42.0, 38.0, 25.0, 17.0, 17.0, 12.0, 14.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6015625, -3.488800048828125, -3.37603759765625, -3.263275146484375, -3.1505126953125, -3.037750244140625, -2.92498779296875, -2.812225341796875, -2.699462890625, -2.586700439453125, -2.47393798828125, -2.361175537109375, -2.2484130859375, -2.135650634765625, -2.02288818359375, -1.910125732421875, -1.79736328125, -1.684600830078125, -1.57183837890625, -1.459075927734375, -1.3463134765625, -1.233551025390625, -1.12078857421875, -1.008026123046875, -0.895263671875, -0.782501220703125, -0.66973876953125, -0.556976318359375, -0.4442138671875, -0.331451416015625, -0.21868896484375, -0.105926513671875, 0.0068359375, 0.119598388671875, 0.23236083984375, 0.345123291015625, 0.4578857421875, 0.570648193359375, 0.68341064453125, 0.796173095703125, 0.908935546875, 1.021697998046875, 1.13446044921875, 1.247222900390625, 1.3599853515625, 1.472747802734375, 1.58551025390625, 1.698272705078125, 1.81103515625, 1.923797607421875, 2.03656005859375, 2.149322509765625, 2.2620849609375, 2.374847412109375, 2.48760986328125, 2.600372314453125, 2.713134765625, 2.825897216796875, 2.93865966796875, 3.051422119140625, 3.1641845703125, 3.276947021484375, 3.38970947265625, 3.502471923828125, 3.615234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 20.0, 34.0, 100.0, 268.0, 303.0, 180.0, 56.0, 18.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.83934020996094, -107.05529022216797, -103.27123260498047, -99.4871826171875, -95.703125, -91.91907501220703, -88.13502502441406, -84.35096740722656, -80.5669174194336, -76.78286743164062, -72.99880981445312, -69.21475982666016, -65.43070983886719, -61.64665222167969, -57.86260223388672, -54.078548431396484, -50.29449462890625, -46.510440826416016, -42.72638702392578, -38.94233703613281, -35.15828323364258, -31.374229431152344, -27.590177536010742, -23.80612564086914, -20.022071838378906, -16.238018035888672, -12.45396614074707, -8.669913291931152, -4.885860443115234, -1.101806640625, 2.6822452545166016, 6.466297149658203, 10.250350952148438, 14.034403800964355, 17.818456649780273, 21.602508544921875, 25.38656234741211, 29.170616149902344, 32.95466613769531, 36.73871994018555, 40.52277374267578, 44.306827545166016, 48.09088134765625, 51.87493133544922, 55.65898513793945, 59.44303894042969, 63.227088928222656, 67.01113891601562, 70.79519653320312, 74.5792465209961, 78.3633041381836, 82.14735412597656, 85.93141174316406, 89.71546173095703, 93.49951171875, 97.2835693359375, 101.06761932373047, 104.85166931152344, 108.63572692871094, 112.4197769165039, 116.20382690429688, 119.98788452148438, 123.77193450927734, 127.55598449707031, 131.3400421142578]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 4.0, 7.0, 11.0, 11.0, 16.0, 18.0, 30.0, 30.0, 39.0, 47.0, 35.0, 52.0, 47.0, 59.0, 57.0, 63.0, 59.0, 52.0, 43.0, 47.0, 45.0, 42.0, 33.0, 31.0, 22.0, 23.0, 18.0, 18.0, 17.0, 9.0, 6.0, 6.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.24606704711914, -40.66707229614258, -39.08807373046875, -37.50907897949219, -35.930084228515625, -34.35108947753906, -32.772090911865234, -31.193096160888672, -29.61410140991211, -28.035104751586914, -26.45611000061035, -24.877113342285156, -23.298118591308594, -21.7191219329834, -20.140125274658203, -18.56113052368164, -16.982133865356445, -15.403138160705566, -13.824142456054688, -12.245145797729492, -10.66615104675293, -9.087154388427734, -7.5081586837768555, -5.929162979125977, -4.350167274475098, -2.7711715698242188, -1.1921756267547607, 0.38682031631469727, 1.9658160209655762, 3.544811725616455, 5.123807907104492, 6.702803611755371, 8.28179931640625, 9.860795021057129, 11.439790725708008, 13.018787384033203, 14.597782135009766, 16.17677879333496, 17.755775451660156, 19.33477020263672, 20.91376495361328, 22.492761611938477, 24.07175636291504, 25.650753021240234, 27.229747772216797, 28.808744430541992, 30.387741088867188, 31.96673583984375, 33.54573059082031, 35.124725341796875, 36.7037239074707, 38.282718658447266, 39.86171340942383, 41.44070816040039, 43.01970672607422, 44.59870147705078, 46.17770004272461, 47.75669479370117, 49.335693359375, 50.91468811035156, 52.493682861328125, 54.07267761230469, 55.651676177978516, 57.23067092895508, 58.80966567993164]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 11.0, 30.0, 22.0, 49.0, 63.0, 95.0, 180.0, 287.0, 468.0, 863.0, 1652.0, 3193.0, 6765.0, 14897.0, 37496.0, 119885.0, 615117.0, 2543572.0, 656635.0, 123603.0, 39101.0, 15573.0, 7249.0, 3478.0, 1763.0, 935.0, 518.0, 293.0, 171.0, 121.0, 65.0, 48.0, 16.0, 16.0, 11.0, 5.0, 5.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.255859375, -3.158721923828125, -3.06158447265625, -2.964447021484375, -2.8673095703125, -2.770172119140625, -2.67303466796875, -2.575897216796875, -2.478759765625, -2.381622314453125, -2.28448486328125, -2.187347412109375, -2.0902099609375, -1.993072509765625, -1.89593505859375, -1.798797607421875, -1.70166015625, -1.604522705078125, -1.50738525390625, -1.410247802734375, -1.3131103515625, -1.215972900390625, -1.11883544921875, -1.021697998046875, -0.924560546875, -0.827423095703125, -0.73028564453125, -0.633148193359375, -0.5360107421875, -0.438873291015625, -0.34173583984375, -0.244598388671875, -0.1474609375, -0.050323486328125, 0.04681396484375, 0.143951416015625, 0.2410888671875, 0.338226318359375, 0.43536376953125, 0.532501220703125, 0.629638671875, 0.726776123046875, 0.82391357421875, 0.921051025390625, 1.0181884765625, 1.115325927734375, 1.21246337890625, 1.309600830078125, 1.40673828125, 1.503875732421875, 1.60101318359375, 1.698150634765625, 1.7952880859375, 1.892425537109375, 1.98956298828125, 2.086700439453125, 2.183837890625, 2.280975341796875, 2.37811279296875, 2.475250244140625, 2.5723876953125, 2.669525146484375, 2.76666259765625, 2.863800048828125, 2.9609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 9.0, 10.0, 13.0, 20.0, 40.0, 53.0, 59.0, 82.0, 105.0, 117.0, 102.0, 103.0, 80.0, 70.0, 54.0, 37.0, 14.0, 10.0, 10.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4696044921875, -4.333740234375, -4.1978759765625, -4.06201171875, -3.9261474609375, -3.790283203125, -3.6544189453125, -3.5185546875, -3.3826904296875, -3.246826171875, -3.1109619140625, -2.97509765625, -2.8392333984375, -2.703369140625, -2.5675048828125, -2.431640625, -2.2957763671875, -2.159912109375, -2.0240478515625, -1.88818359375, -1.7523193359375, -1.616455078125, -1.4805908203125, -1.3447265625, -1.2088623046875, -1.072998046875, -0.9371337890625, -0.80126953125, -0.6654052734375, -0.529541015625, -0.3936767578125, -0.2578125, -0.1219482421875, 0.013916015625, 0.1497802734375, 0.28564453125, 0.4215087890625, 0.557373046875, 0.6932373046875, 0.8291015625, 0.9649658203125, 1.100830078125, 1.2366943359375, 1.37255859375, 1.5084228515625, 1.644287109375, 1.7801513671875, 1.916015625, 2.0518798828125, 2.187744140625, 2.3236083984375, 2.45947265625, 2.5953369140625, 2.731201171875, 2.8670654296875, 3.0029296875, 3.1387939453125, 3.274658203125, 3.4105224609375, 3.54638671875, 3.6822509765625, 3.818115234375, 3.9539794921875, 4.08984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 19.0, 25.0, 23.0, 47.0, 73.0, 171.0, 314.0, 792.0, 2108.0, 6446.0, 26021.0, 159156.0, 2942591.0, 959110.0, 75495.0, 15184.0, 4286.0, 1441.0, 477.0, 209.0, 111.0, 46.0, 38.0, 25.0, 19.0, 10.0, 12.0, 5.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38671875, -5.19305419921875, -4.9993896484375, -4.80572509765625, -4.612060546875, -4.41839599609375, -4.2247314453125, -4.03106689453125, -3.83740234375, -3.64373779296875, -3.4500732421875, -3.25640869140625, -3.062744140625, -2.86907958984375, -2.6754150390625, -2.48175048828125, -2.2880859375, -2.09442138671875, -1.9007568359375, -1.70709228515625, -1.513427734375, -1.31976318359375, -1.1260986328125, -0.93243408203125, -0.73876953125, -0.54510498046875, -0.3514404296875, -0.15777587890625, 0.035888671875, 0.22955322265625, 0.4232177734375, 0.61688232421875, 0.810546875, 1.00421142578125, 1.1978759765625, 1.39154052734375, 1.585205078125, 1.77886962890625, 1.9725341796875, 2.16619873046875, 2.35986328125, 2.55352783203125, 2.7471923828125, 2.94085693359375, 3.134521484375, 3.32818603515625, 3.5218505859375, 3.71551513671875, 3.9091796875, 4.10284423828125, 4.2965087890625, 4.49017333984375, 4.683837890625, 4.87750244140625, 5.0711669921875, 5.26483154296875, 5.45849609375, 5.65216064453125, 5.8458251953125, 6.03948974609375, 6.233154296875, 6.42681884765625, 6.6204833984375, 6.81414794921875, 7.0078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 5.0, 8.0, 7.0, 12.0, 19.0, 29.0, 23.0, 40.0, 66.0, 88.0, 153.0, 312.0, 555.0, 870.0, 752.0, 423.0, 269.0, 136.0, 90.0, 59.0, 44.0, 29.0, 15.0, 18.0, 17.0, 7.0, 6.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.30859375, -7.11566162109375, -6.9227294921875, -6.72979736328125, -6.536865234375, -6.34393310546875, -6.1510009765625, -5.95806884765625, -5.76513671875, -5.57220458984375, -5.3792724609375, -5.18634033203125, -4.993408203125, -4.80047607421875, -4.6075439453125, -4.41461181640625, -4.2216796875, -4.02874755859375, -3.8358154296875, -3.64288330078125, -3.449951171875, -3.25701904296875, -3.0640869140625, -2.87115478515625, -2.67822265625, -2.48529052734375, -2.2923583984375, -2.09942626953125, -1.906494140625, -1.71356201171875, -1.5206298828125, -1.32769775390625, -1.134765625, -0.94183349609375, -0.7489013671875, -0.55596923828125, -0.363037109375, -0.17010498046875, 0.0228271484375, 0.21575927734375, 0.40869140625, 0.60162353515625, 0.7945556640625, 0.98748779296875, 1.180419921875, 1.37335205078125, 1.5662841796875, 1.75921630859375, 1.9521484375, 2.14508056640625, 2.3380126953125, 2.53094482421875, 2.723876953125, 2.91680908203125, 3.1097412109375, 3.30267333984375, 3.49560546875, 3.68853759765625, 3.8814697265625, 4.07440185546875, 4.267333984375, 4.46026611328125, 4.6531982421875, 4.84613037109375, 5.0390625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 37.0, 82.0, 227.0, 274.0, 218.0, 80.0, 27.0, 18.0, 5.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.96684265136719, -81.2141342163086, -78.46142578125, -75.70872497558594, -72.95601654052734, -70.20330810546875, -67.45059967041016, -64.69789123535156, -61.945186614990234, -59.19247817993164, -56.43977355957031, -53.68706512451172, -50.934356689453125, -48.1816520690918, -45.4289436340332, -42.676239013671875, -39.92353057861328, -37.17082214355469, -34.41811752319336, -31.665409088134766, -28.912702560424805, -26.159996032714844, -23.40728759765625, -20.65458106994629, -17.901874542236328, -15.149168014526367, -12.39646053314209, -9.643753051757812, -6.891046524047852, -4.138339996337891, -1.3856315612792969, 1.367074966430664, 4.119781494140625, 6.872488498687744, 9.625195503234863, 12.37790298461914, 15.130609512329102, 17.883316040039062, 20.636024475097656, 23.388731002807617, 26.141437530517578, 28.89414405822754, 31.6468505859375, 34.399559020996094, 37.15226745605469, 39.904972076416016, 42.65768051147461, 45.41038513183594, 48.16309356689453, 50.915802001953125, 53.66850662231445, 56.42121505737305, 59.173919677734375, 61.92662811279297, 64.67933654785156, 67.43204498291016, 70.18475341796875, 72.93746185302734, 75.69017028808594, 78.44287109375, 81.1955795288086, 83.94828796386719, 86.70099639892578, 89.45370483398438, 92.20640563964844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 0.0, 4.0, 12.0, 9.0, 8.0, 21.0, 10.0, 18.0, 19.0, 19.0, 25.0, 32.0, 39.0, 40.0, 49.0, 52.0, 56.0, 61.0, 51.0, 47.0, 50.0, 46.0, 41.0, 47.0, 39.0, 24.0, 32.0, 27.0, 21.0, 22.0, 28.0, 15.0, 12.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.606494903564453, -21.835792541503906, -21.06509017944336, -20.29438591003418, -19.523683547973633, -18.752981185913086, -17.982276916503906, -17.21157455444336, -16.440872192382812, -15.670169830322266, -14.899466514587402, -14.128763198852539, -13.358060836791992, -12.587358474731445, -11.816655158996582, -11.045951843261719, -10.275249481201172, -9.504547119140625, -8.733843803405762, -7.963140964508057, -7.192438125610352, -6.4217352867126465, -5.651032447814941, -4.880329608917236, -4.109626770019531, -3.338923931121826, -2.568221092224121, -1.797518253326416, -1.026815414428711, -0.25611257553100586, 0.5145902633666992, 1.2852931022644043, 2.0559940338134766, 2.8266968727111816, 3.5973997116088867, 4.368102550506592, 5.138805389404297, 5.909508228302002, 6.680211067199707, 7.450913906097412, 8.221616744995117, 8.992319107055664, 9.763022422790527, 10.53372573852539, 11.304428100585938, 12.075130462646484, 12.845833778381348, 13.616537094116211, 14.387239456176758, 15.157941818237305, 15.928645133972168, 16.69934844970703, 17.470050811767578, 18.240753173828125, 19.011455535888672, 19.78215980529785, 20.5528621673584, 21.323564529418945, 22.094268798828125, 22.864971160888672, 23.63567352294922, 24.406375885009766, 25.177078247070312, 25.947782516479492, 26.71848487854004]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 12.0, 16.0, 27.0, 44.0, 62.0, 117.0, 204.0, 478.0, 881.0, 1868.0, 4313.0, 10508.0, 30159.0, 99580.0, 493398.0, 305346.0, 66052.0, 21417.0, 7837.0, 3215.0, 1479.0, 717.0, 382.0, 192.0, 102.0, 60.0, 35.0, 22.0, 9.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.2073974609375, -6.012451171875, -5.8175048828125, -5.62255859375, -5.4276123046875, -5.232666015625, -5.0377197265625, -4.8427734375, -4.6478271484375, -4.452880859375, -4.2579345703125, -4.06298828125, -3.8680419921875, -3.673095703125, -3.4781494140625, -3.283203125, -3.0882568359375, -2.893310546875, -2.6983642578125, -2.50341796875, -2.3084716796875, -2.113525390625, -1.9185791015625, -1.7236328125, -1.5286865234375, -1.333740234375, -1.1387939453125, -0.94384765625, -0.7489013671875, -0.553955078125, -0.3590087890625, -0.1640625, 0.0308837890625, 0.225830078125, 0.4207763671875, 0.61572265625, 0.8106689453125, 1.005615234375, 1.2005615234375, 1.3955078125, 1.5904541015625, 1.785400390625, 1.9803466796875, 2.17529296875, 2.3702392578125, 2.565185546875, 2.7601318359375, 2.955078125, 3.1500244140625, 3.344970703125, 3.5399169921875, 3.73486328125, 3.9298095703125, 4.124755859375, 4.3197021484375, 4.5146484375, 4.7095947265625, 4.904541015625, 5.0994873046875, 5.29443359375, 5.4893798828125, 5.684326171875, 5.8792724609375, 6.07421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 17.0, 40.0, 44.0, 72.0, 66.0, 79.0, 92.0, 89.0, 106.0, 94.0, 82.0, 55.0, 45.0, 32.0, 29.0, 15.0, 6.0, 9.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.0546875, -4.923614501953125, -4.79254150390625, -4.661468505859375, -4.5303955078125, -4.399322509765625, -4.26824951171875, -4.137176513671875, -4.006103515625, -3.875030517578125, -3.74395751953125, -3.612884521484375, -3.4818115234375, -3.350738525390625, -3.21966552734375, -3.088592529296875, -2.95751953125, -2.826446533203125, -2.69537353515625, -2.564300537109375, -2.4332275390625, -2.302154541015625, -2.17108154296875, -2.040008544921875, -1.908935546875, -1.777862548828125, -1.64678955078125, -1.515716552734375, -1.3846435546875, -1.253570556640625, -1.12249755859375, -0.991424560546875, -0.8603515625, -0.729278564453125, -0.59820556640625, -0.467132568359375, -0.3360595703125, -0.204986572265625, -0.07391357421875, 0.057159423828125, 0.188232421875, 0.319305419921875, 0.45037841796875, 0.581451416015625, 0.7125244140625, 0.843597412109375, 0.97467041015625, 1.105743408203125, 1.23681640625, 1.367889404296875, 1.49896240234375, 1.630035400390625, 1.7611083984375, 1.892181396484375, 2.02325439453125, 2.154327392578125, 2.285400390625, 2.416473388671875, 2.54754638671875, 2.678619384765625, 2.8096923828125, 2.940765380859375, 3.07183837890625, 3.202911376953125, 3.333984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 8.0, 8.0, 5.0, 8.0, 11.0, 9.0, 20.0, 16.0, 31.0, 63.0, 70.0, 97.0, 154.0, 229.0, 418.0, 723.0, 1632.0, 4359.0, 23167.0, 595613.0, 395382.0, 19106.0, 4054.0, 1555.0, 689.0, 379.0, 263.0, 155.0, 93.0, 66.0, 47.0, 38.0, 26.0, 11.0, 12.0, 10.0, 3.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.6015625, -13.1475830078125, -12.693603515625, -12.2396240234375, -11.78564453125, -11.3316650390625, -10.877685546875, -10.4237060546875, -9.9697265625, -9.5157470703125, -9.061767578125, -8.6077880859375, -8.15380859375, -7.6998291015625, -7.245849609375, -6.7918701171875, -6.337890625, -5.8839111328125, -5.429931640625, -4.9759521484375, -4.52197265625, -4.0679931640625, -3.614013671875, -3.1600341796875, -2.7060546875, -2.2520751953125, -1.798095703125, -1.3441162109375, -0.89013671875, -0.4361572265625, 0.017822265625, 0.4718017578125, 0.92578125, 1.3797607421875, 1.833740234375, 2.2877197265625, 2.74169921875, 3.1956787109375, 3.649658203125, 4.1036376953125, 4.5576171875, 5.0115966796875, 5.465576171875, 5.9195556640625, 6.37353515625, 6.8275146484375, 7.281494140625, 7.7354736328125, 8.189453125, 8.6434326171875, 9.097412109375, 9.5513916015625, 10.00537109375, 10.4593505859375, 10.913330078125, 11.3673095703125, 11.8212890625, 12.2752685546875, 12.729248046875, 13.1832275390625, 13.63720703125, 14.0911865234375, 14.545166015625, 14.9991455078125, 15.453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 10.0, 15.0, 20.0, 13.0, 37.0, 50.0, 47.0, 56.0, 74.0, 62.0, 90.0, 85.0, 74.0, 59.0, 47.0, 61.0, 50.0, 37.0, 26.0, 19.0, 17.0, 9.0, 5.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.494140625, -16.91015625, -16.326171875, -15.7421875, -15.158203125, -14.57421875, -13.990234375, -13.40625, -12.822265625, -12.23828125, -11.654296875, -11.0703125, -10.486328125, -9.90234375, -9.318359375, -8.734375, -8.150390625, -7.56640625, -6.982421875, -6.3984375, -5.814453125, -5.23046875, -4.646484375, -4.0625, -3.478515625, -2.89453125, -2.310546875, -1.7265625, -1.142578125, -0.55859375, 0.025390625, 0.609375, 1.193359375, 1.77734375, 2.361328125, 2.9453125, 3.529296875, 4.11328125, 4.697265625, 5.28125, 5.865234375, 6.44921875, 7.033203125, 7.6171875, 8.201171875, 8.78515625, 9.369140625, 9.953125, 10.537109375, 11.12109375, 11.705078125, 12.2890625, 12.873046875, 13.45703125, 14.041015625, 14.625, 15.208984375, 15.79296875, 16.376953125, 16.9609375, 17.544921875, 18.12890625, 18.712890625, 19.296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 9.0, 14.0, 28.0, 33.0, 48.0, 95.0, 189.0, 457.0, 1634.0, 9199.0, 189973.0, 822494.0, 20417.0, 2668.0, 716.0, 266.0, 127.0, 71.0, 40.0, 13.0, 13.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.6953125, -10.42901611328125, -10.1627197265625, -9.89642333984375, -9.630126953125, -9.36383056640625, -9.0975341796875, -8.83123779296875, -8.56494140625, -8.29864501953125, -8.0323486328125, -7.76605224609375, -7.499755859375, -7.23345947265625, -6.9671630859375, -6.70086669921875, -6.4345703125, -6.16827392578125, -5.9019775390625, -5.63568115234375, -5.369384765625, -5.10308837890625, -4.8367919921875, -4.57049560546875, -4.30419921875, -4.03790283203125, -3.7716064453125, -3.50531005859375, -3.239013671875, -2.97271728515625, -2.7064208984375, -2.44012451171875, -2.173828125, -1.90753173828125, -1.6412353515625, -1.37493896484375, -1.108642578125, -0.84234619140625, -0.5760498046875, -0.30975341796875, -0.04345703125, 0.22283935546875, 0.4891357421875, 0.75543212890625, 1.021728515625, 1.28802490234375, 1.5543212890625, 1.82061767578125, 2.0869140625, 2.35321044921875, 2.6195068359375, 2.88580322265625, 3.152099609375, 3.41839599609375, 3.6846923828125, 3.95098876953125, 4.21728515625, 4.48358154296875, 4.7498779296875, 5.01617431640625, 5.282470703125, 5.54876708984375, 5.8150634765625, 6.08135986328125, 6.34765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 7.0, 14.0, 5.0, 16.0, 16.0, 33.0, 38.0, 66.0, 135.0, 242.0, 162.0, 74.0, 42.0, 30.0, 19.0, 17.0, 26.0, 11.0, 13.0, 3.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010089874267578125, -0.0009696930646896362, -0.00093039870262146, -0.0008911043405532837, -0.0008518099784851074, -0.0008125156164169312, -0.0007732212543487549, -0.0007339268922805786, -0.0006946325302124023, -0.0006553381681442261, -0.0006160438060760498, -0.0005767494440078735, -0.0005374550819396973, -0.000498160719871521, -0.0004588663578033447, -0.00041957199573516846, -0.0003802776336669922, -0.0003409832715988159, -0.00030168890953063965, -0.0002623945474624634, -0.0002231001853942871, -0.00018380582332611084, -0.00014451146125793457, -0.0001052170991897583, -6.592273712158203e-05, -2.6628375053405762e-05, 1.2665987014770508e-05, 5.196034908294678e-05, 9.125471115112305e-05, 0.00013054907321929932, 0.00016984343528747559, 0.00020913779735565186, 0.0002484321594238281, 0.0002877265214920044, 0.00032702088356018066, 0.00036631524562835693, 0.0004056096076965332, 0.00044490396976470947, 0.00048419833183288574, 0.000523492693901062, 0.0005627870559692383, 0.0006020814180374146, 0.0006413757801055908, 0.0006806701421737671, 0.0007199645042419434, 0.0007592588663101196, 0.0007985532283782959, 0.0008378475904464722, 0.0008771419525146484, 0.0009164363145828247, 0.000955730676651001, 0.0009950250387191772, 0.0010343194007873535, 0.0010736137628555298, 0.001112908124923706, 0.0011522024869918823, 0.0011914968490600586, 0.0012307912111282349, 0.0012700855731964111, 0.0013093799352645874, 0.0013486742973327637, 0.00138796865940094, 0.0014272630214691162, 0.0014665573835372925, 0.0015058517456054688]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 14.0, 32.0, 31.0, 42.0, 67.0, 101.0, 166.0, 358.0, 669.0, 1536.0, 4532.0, 21171.0, 272908.0, 700515.0, 36234.0, 6420.0, 1976.0, 827.0, 357.0, 214.0, 118.0, 93.0, 45.0, 41.0, 16.0, 19.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.41796875, -5.23199462890625, -5.0460205078125, -4.86004638671875, -4.674072265625, -4.48809814453125, -4.3021240234375, -4.11614990234375, -3.93017578125, -3.74420166015625, -3.5582275390625, -3.37225341796875, -3.186279296875, -3.00030517578125, -2.8143310546875, -2.62835693359375, -2.4423828125, -2.25640869140625, -2.0704345703125, -1.88446044921875, -1.698486328125, -1.51251220703125, -1.3265380859375, -1.14056396484375, -0.95458984375, -0.76861572265625, -0.5826416015625, -0.39666748046875, -0.210693359375, -0.02471923828125, 0.1612548828125, 0.34722900390625, 0.533203125, 0.71917724609375, 0.9051513671875, 1.09112548828125, 1.277099609375, 1.46307373046875, 1.6490478515625, 1.83502197265625, 2.02099609375, 2.20697021484375, 2.3929443359375, 2.57891845703125, 2.764892578125, 2.95086669921875, 3.1368408203125, 3.32281494140625, 3.5087890625, 3.69476318359375, 3.8807373046875, 4.06671142578125, 4.252685546875, 4.43865966796875, 4.6246337890625, 4.81060791015625, 4.99658203125, 5.18255615234375, 5.3685302734375, 5.55450439453125, 5.740478515625, 5.92645263671875, 6.1124267578125, 6.29840087890625, 6.484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 17.0, 9.0, 16.0, 22.0, 22.0, 34.0, 43.0, 47.0, 90.0, 95.0, 118.0, 105.0, 87.0, 77.0, 52.0, 32.0, 25.0, 14.0, 16.0, 16.0, 11.0, 13.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.40032958984375, -4.2655029296875, -4.13067626953125, -3.995849609375, -3.86102294921875, -3.7261962890625, -3.59136962890625, -3.45654296875, -3.32171630859375, -3.1868896484375, -3.05206298828125, -2.917236328125, -2.78240966796875, -2.6475830078125, -2.51275634765625, -2.3779296875, -2.24310302734375, -2.1082763671875, -1.97344970703125, -1.838623046875, -1.70379638671875, -1.5689697265625, -1.43414306640625, -1.29931640625, -1.16448974609375, -1.0296630859375, -0.89483642578125, -0.760009765625, -0.62518310546875, -0.4903564453125, -0.35552978515625, -0.220703125, -0.08587646484375, 0.0489501953125, 0.18377685546875, 0.318603515625, 0.45343017578125, 0.5882568359375, 0.72308349609375, 0.85791015625, 0.99273681640625, 1.1275634765625, 1.26239013671875, 1.397216796875, 1.53204345703125, 1.6668701171875, 1.80169677734375, 1.9365234375, 2.07135009765625, 2.2061767578125, 2.34100341796875, 2.475830078125, 2.61065673828125, 2.7454833984375, 2.88031005859375, 3.01513671875, 3.14996337890625, 3.2847900390625, 3.41961669921875, 3.554443359375, 3.68927001953125, 3.8240966796875, 3.95892333984375, 4.09375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 16.0, 53.0, 174.0, 350.0, 247.0, 96.0, 36.0, 9.0, 10.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-161.52520751953125, -157.45751953125, -153.3898162841797, -149.32212829589844, -145.25442504882812, -141.18673706054688, -137.11903381347656, -133.0513458251953, -128.983642578125, -124.91594696044922, -120.84825134277344, -116.78055572509766, -112.71286010742188, -108.6451644897461, -104.57746887207031, -100.50978088378906, -96.44208526611328, -92.3743896484375, -88.30669403076172, -84.23899841308594, -80.17130279541016, -76.10360717773438, -72.03591918945312, -67.96821594238281, -63.9005241394043, -59.832828521728516, -55.765132904052734, -51.69744110107422, -47.62974548339844, -43.562049865722656, -39.494354248046875, -35.426658630371094, -31.35895538330078, -27.291259765625, -23.22356414794922, -19.15587043762207, -15.088174819946289, -11.020479202270508, -6.952785491943359, -2.885089874267578, 1.1826057434082031, 5.250300884246826, 9.31799602508545, 13.385690689086914, 17.453386306762695, 21.521081924438477, 25.588775634765625, 29.656471252441406, 33.72416687011719, 37.79186248779297, 41.85955810546875, 45.92725372314453, 49.99494934082031, 54.062644958496094, 58.13033676147461, 62.19803237915039, 66.26573181152344, 70.33342742919922, 74.401123046875, 78.46881866455078, 82.53651428222656, 86.60420989990234, 90.67190551757812, 94.73959350585938, 98.80728912353516]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 8.0, 14.0, 21.0, 21.0, 25.0, 29.0, 28.0, 34.0, 46.0, 51.0, 49.0, 58.0, 55.0, 60.0, 59.0, 63.0, 58.0, 38.0, 45.0, 39.0, 29.0, 28.0, 24.0, 17.0, 19.0, 9.0, 6.0, 5.0, 8.0, 4.0, 6.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.771949768066406, -42.222129821777344, -40.67230987548828, -39.122493743896484, -37.57267379760742, -36.02285385131836, -34.47303771972656, -32.9232177734375, -31.373397827148438, -29.823577880859375, -28.273759841918945, -26.723941802978516, -25.174121856689453, -23.62430191040039, -22.07448387145996, -20.52466583251953, -18.97484588623047, -17.425025939941406, -15.875207901000977, -14.32538890838623, -12.775569915771484, -11.225750923156738, -9.675931930541992, -8.126112937927246, -6.5762939453125, -5.026474952697754, -3.476655960083008, -1.9268369674682617, -0.3770179748535156, 1.1728010177612305, 2.7226200103759766, 4.272439002990723, 5.822261810302734, 7.3720808029174805, 8.921899795532227, 10.471718788146973, 12.021537780761719, 13.571356773376465, 15.121175765991211, 16.67099380493164, 18.220813751220703, 19.770633697509766, 21.320451736450195, 22.870269775390625, 24.420089721679688, 25.96990966796875, 27.51972770690918, 29.06954574584961, 30.619365692138672, 32.169185638427734, 33.71900177001953, 35.268821716308594, 36.818641662597656, 38.36846160888672, 39.91828155517578, 41.46809768676758, 43.01791763305664, 44.5677375793457, 46.1175537109375, 47.66737365722656, 49.217193603515625, 50.76701354980469, 52.31683349609375, 53.86664962768555, 55.41646957397461]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 12.0, 16.0, 19.0, 31.0, 54.0, 76.0, 124.0, 248.0, 1270.0, 296401.0, 3891773.0, 3467.0, 360.0, 173.0, 77.0, 62.0, 36.0, 18.0, 15.0, 10.0, 8.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.828125, -30.096435546875, -29.36474609375, -28.633056640625, -27.9013671875, -27.169677734375, -26.43798828125, -25.706298828125, -24.974609375, -24.242919921875, -23.51123046875, -22.779541015625, -22.0478515625, -21.316162109375, -20.58447265625, -19.852783203125, -19.12109375, -18.389404296875, -17.65771484375, -16.926025390625, -16.1943359375, -15.462646484375, -14.73095703125, -13.999267578125, -13.267578125, -12.535888671875, -11.80419921875, -11.072509765625, -10.3408203125, -9.609130859375, -8.87744140625, -8.145751953125, -7.4140625, -6.682373046875, -5.95068359375, -5.218994140625, -4.4873046875, -3.755615234375, -3.02392578125, -2.292236328125, -1.560546875, -0.828857421875, -0.09716796875, 0.634521484375, 1.3662109375, 2.097900390625, 2.82958984375, 3.561279296875, 4.29296875, 5.024658203125, 5.75634765625, 6.488037109375, 7.2197265625, 7.951416015625, 8.68310546875, 9.414794921875, 10.146484375, 10.878173828125, 11.60986328125, 12.341552734375, 13.0732421875, 13.804931640625, 14.53662109375, 15.268310546875, 16.0]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 12.0, 6.0, 14.0, 22.0, 37.0, 41.0, 63.0, 79.0, 94.0, 88.0, 111.0, 79.0, 86.0, 56.0, 58.0, 57.0, 32.0, 23.0, 15.0, 13.0, 6.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.41412353515625, -3.2852783203125, -3.15643310546875, -3.027587890625, -2.89874267578125, -2.7698974609375, -2.64105224609375, -2.51220703125, -2.38336181640625, -2.2545166015625, -2.12567138671875, -1.996826171875, -1.86798095703125, -1.7391357421875, -1.61029052734375, -1.4814453125, -1.35260009765625, -1.2237548828125, -1.09490966796875, -0.966064453125, -0.83721923828125, -0.7083740234375, -0.57952880859375, -0.45068359375, -0.32183837890625, -0.1929931640625, -0.06414794921875, 0.064697265625, 0.19354248046875, 0.3223876953125, 0.45123291015625, 0.580078125, 0.70892333984375, 0.8377685546875, 0.96661376953125, 1.095458984375, 1.22430419921875, 1.3531494140625, 1.48199462890625, 1.61083984375, 1.73968505859375, 1.8685302734375, 1.99737548828125, 2.126220703125, 2.25506591796875, 2.3839111328125, 2.51275634765625, 2.6416015625, 2.77044677734375, 2.8992919921875, 3.02813720703125, 3.156982421875, 3.28582763671875, 3.4146728515625, 3.54351806640625, 3.67236328125, 3.80120849609375, 3.9300537109375, 4.05889892578125, 4.187744140625, 4.31658935546875, 4.4454345703125, 4.57427978515625, 4.703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 21.0, 19.0, 33.0, 43.0, 73.0, 92.0, 158.0, 244.0, 416.0, 613.0, 1172.0, 2168.0, 4224.0, 8951.0, 20816.0, 58160.0, 224626.0, 1457818.0, 1990817.0, 305341.0, 73290.0, 24448.0, 10415.0, 4835.0, 2305.0, 1209.0, 734.0, 435.0, 265.0, 158.0, 118.0, 68.0, 52.0, 35.0, 32.0, 17.0, 15.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.798828125, -3.690582275390625, -3.58233642578125, -3.474090576171875, -3.3658447265625, -3.257598876953125, -3.14935302734375, -3.041107177734375, -2.932861328125, -2.824615478515625, -2.71636962890625, -2.608123779296875, -2.4998779296875, -2.391632080078125, -2.28338623046875, -2.175140380859375, -2.06689453125, -1.958648681640625, -1.85040283203125, -1.742156982421875, -1.6339111328125, -1.525665283203125, -1.41741943359375, -1.309173583984375, -1.200927734375, -1.092681884765625, -0.98443603515625, -0.876190185546875, -0.7679443359375, -0.659698486328125, -0.55145263671875, -0.443206787109375, -0.3349609375, -0.226715087890625, -0.11846923828125, -0.010223388671875, 0.0980224609375, 0.206268310546875, 0.31451416015625, 0.422760009765625, 0.531005859375, 0.639251708984375, 0.74749755859375, 0.855743408203125, 0.9639892578125, 1.072235107421875, 1.18048095703125, 1.288726806640625, 1.39697265625, 1.505218505859375, 1.61346435546875, 1.721710205078125, 1.8299560546875, 1.938201904296875, 2.04644775390625, 2.154693603515625, 2.262939453125, 2.371185302734375, 2.47943115234375, 2.587677001953125, 2.6959228515625, 2.804168701171875, 2.91241455078125, 3.020660400390625, 3.12890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 7.0, 7.0, 8.0, 12.0, 28.0, 32.0, 50.0, 88.0, 118.0, 214.0, 400.0, 688.0, 871.0, 630.0, 375.0, 207.0, 124.0, 67.0, 51.0, 29.0, 16.0, 14.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.078125, -5.87841796875, -5.6787109375, -5.47900390625, -5.279296875, -5.07958984375, -4.8798828125, -4.68017578125, -4.48046875, -4.28076171875, -4.0810546875, -3.88134765625, -3.681640625, -3.48193359375, -3.2822265625, -3.08251953125, -2.8828125, -2.68310546875, -2.4833984375, -2.28369140625, -2.083984375, -1.88427734375, -1.6845703125, -1.48486328125, -1.28515625, -1.08544921875, -0.8857421875, -0.68603515625, -0.486328125, -0.28662109375, -0.0869140625, 0.11279296875, 0.3125, 0.51220703125, 0.7119140625, 0.91162109375, 1.111328125, 1.31103515625, 1.5107421875, 1.71044921875, 1.91015625, 2.10986328125, 2.3095703125, 2.50927734375, 2.708984375, 2.90869140625, 3.1083984375, 3.30810546875, 3.5078125, 3.70751953125, 3.9072265625, 4.10693359375, 4.306640625, 4.50634765625, 4.7060546875, 4.90576171875, 5.10546875, 5.30517578125, 5.5048828125, 5.70458984375, 5.904296875, 6.10400390625, 6.3037109375, 6.50341796875, 6.703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 6.0, 12.0, 27.0, 99.0, 229.0, 294.0, 201.0, 77.0, 26.0, 14.0, 6.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.131591796875, -96.42340087890625, -93.7152099609375, -91.00701904296875, -88.298828125, -85.59063720703125, -82.8824462890625, -80.17426300048828, -77.46607208251953, -74.75788116455078, -72.04969024658203, -69.34149932861328, -66.63330841064453, -63.92512130737305, -61.2169303894043, -58.50874328613281, -55.8005485534668, -53.09235763549805, -50.3841667175293, -47.67597961425781, -44.96778869628906, -42.25959777832031, -39.55140686035156, -36.84321594238281, -34.13502502441406, -31.426834106445312, -28.718645095825195, -26.010454177856445, -23.302265167236328, -20.594074249267578, -17.885883331298828, -15.177694320678711, -12.469505310058594, -9.76131534576416, -7.053124904632568, -4.344934463500977, -1.636744499206543, 1.0714454650878906, 3.7796363830566406, 6.487825393676758, 9.196016311645508, 11.904206275939941, 14.612396240234375, 17.320587158203125, 20.028778076171875, 22.736967086791992, 25.445158004760742, 28.15334701538086, 30.86153793334961, 33.56972885131836, 36.27791976928711, 38.986106872558594, 41.694297790527344, 44.402488708496094, 47.110679626464844, 49.818870544433594, 52.527061462402344, 55.235252380371094, 57.943443298339844, 60.651634216308594, 63.35982131958008, 66.06800842285156, 68.77619934082031, 71.48439025878906, 74.19258117675781]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 12.0, 11.0, 19.0, 14.0, 26.0, 23.0, 24.0, 22.0, 37.0, 35.0, 33.0, 44.0, 61.0, 41.0, 44.0, 41.0, 51.0, 56.0, 60.0, 35.0, 37.0, 26.0, 32.0, 31.0, 33.0, 20.0, 19.0, 18.0, 13.0, 10.0, 11.0, 12.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.399124145507812, -25.634071350097656, -24.8690185546875, -24.10396385192871, -23.338911056518555, -22.5738582611084, -21.80880355834961, -21.043750762939453, -20.278697967529297, -19.51364517211914, -18.748592376708984, -17.983537673950195, -17.21848487854004, -16.453432083129883, -15.68837833404541, -14.923324584960938, -14.158271789550781, -13.393218994140625, -12.628165245056152, -11.86311149597168, -11.098058700561523, -10.333005905151367, -9.567952156066895, -8.802898406982422, -8.037845611572266, -7.272792339324951, -6.507739067077637, -5.742685794830322, -4.977632522583008, -4.212579250335693, -3.447525978088379, -2.6824727058410645, -1.9174213409423828, -1.1523680686950684, -0.3873147964477539, 0.37773847579956055, 1.142791748046875, 1.9078450202941895, 2.672898292541504, 3.4379515647888184, 4.203004837036133, 4.968058109283447, 5.733111381530762, 6.498164653778076, 7.263217926025391, 8.028270721435547, 8.79332447052002, 9.558378219604492, 10.323431015014648, 11.088483810424805, 11.853537559509277, 12.61859130859375, 13.383644104003906, 14.148696899414062, 14.913750648498535, 15.678804397583008, 16.443857192993164, 17.20890998840332, 17.97396469116211, 18.739017486572266, 19.504070281982422, 20.269123077392578, 21.034175872802734, 21.799230575561523, 22.56428337097168]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 4.0, 8.0, 21.0, 20.0, 24.0, 52.0, 93.0, 112.0, 177.0, 294.0, 545.0, 912.0, 1762.0, 3412.0, 7370.0, 16662.0, 40089.0, 127377.0, 470863.0, 264730.0, 67078.0, 25389.0, 10943.0, 5026.0, 2561.0, 1265.0, 709.0, 403.0, 224.0, 130.0, 90.0, 73.0, 49.0, 24.0, 19.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.91986083984375, -3.7733154296875, -3.62677001953125, -3.480224609375, -3.33367919921875, -3.1871337890625, -3.04058837890625, -2.89404296875, -2.74749755859375, -2.6009521484375, -2.45440673828125, -2.307861328125, -2.16131591796875, -2.0147705078125, -1.86822509765625, -1.7216796875, -1.57513427734375, -1.4285888671875, -1.28204345703125, -1.135498046875, -0.98895263671875, -0.8424072265625, -0.69586181640625, -0.54931640625, -0.40277099609375, -0.2562255859375, -0.10968017578125, 0.036865234375, 0.18341064453125, 0.3299560546875, 0.47650146484375, 0.623046875, 0.76959228515625, 0.9161376953125, 1.06268310546875, 1.209228515625, 1.35577392578125, 1.5023193359375, 1.64886474609375, 1.79541015625, 1.94195556640625, 2.0885009765625, 2.23504638671875, 2.381591796875, 2.52813720703125, 2.6746826171875, 2.82122802734375, 2.9677734375, 3.11431884765625, 3.2608642578125, 3.40740966796875, 3.553955078125, 3.70050048828125, 3.8470458984375, 3.99359130859375, 4.14013671875, 4.28668212890625, 4.4332275390625, 4.57977294921875, 4.726318359375, 4.87286376953125, 5.0194091796875, 5.16595458984375, 5.3125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 12.0, 18.0, 25.0, 23.0, 28.0, 36.0, 37.0, 45.0, 50.0, 57.0, 57.0, 54.0, 63.0, 57.0, 57.0, 50.0, 55.0, 59.0, 35.0, 32.0, 25.0, 21.0, 26.0, 14.0, 10.0, 14.0, 4.0, 3.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.078125, -2.991485595703125, -2.90484619140625, -2.818206787109375, -2.7315673828125, -2.644927978515625, -2.55828857421875, -2.471649169921875, -2.385009765625, -2.298370361328125, -2.21173095703125, -2.125091552734375, -2.0384521484375, -1.951812744140625, -1.86517333984375, -1.778533935546875, -1.69189453125, -1.605255126953125, -1.51861572265625, -1.431976318359375, -1.3453369140625, -1.258697509765625, -1.17205810546875, -1.085418701171875, -0.998779296875, -0.912139892578125, -0.82550048828125, -0.738861083984375, -0.6522216796875, -0.565582275390625, -0.47894287109375, -0.392303466796875, -0.3056640625, -0.219024658203125, -0.13238525390625, -0.045745849609375, 0.0408935546875, 0.127532958984375, 0.21417236328125, 0.300811767578125, 0.387451171875, 0.474090576171875, 0.56072998046875, 0.647369384765625, 0.7340087890625, 0.820648193359375, 0.90728759765625, 0.993927001953125, 1.08056640625, 1.167205810546875, 1.25384521484375, 1.340484619140625, 1.4271240234375, 1.513763427734375, 1.60040283203125, 1.687042236328125, 1.773681640625, 1.860321044921875, 1.94696044921875, 2.033599853515625, 2.1202392578125, 2.206878662109375, 2.29351806640625, 2.380157470703125, 2.466796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 6.0, 2.0, 6.0, 8.0, 8.0, 13.0, 24.0, 29.0, 44.0, 47.0, 85.0, 88.0, 140.0, 246.0, 341.0, 523.0, 845.0, 1603.0, 3240.0, 8263.0, 27236.0, 136655.0, 703247.0, 125172.0, 25697.0, 7969.0, 3070.0, 1537.0, 850.0, 524.0, 323.0, 201.0, 167.0, 74.0, 71.0, 52.0, 41.0, 26.0, 15.0, 15.0, 14.0, 10.0, 11.0, 7.0, 11.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.1484375, -7.91876220703125, -7.6890869140625, -7.45941162109375, -7.229736328125, -7.00006103515625, -6.7703857421875, -6.54071044921875, -6.31103515625, -6.08135986328125, -5.8516845703125, -5.62200927734375, -5.392333984375, -5.16265869140625, -4.9329833984375, -4.70330810546875, -4.4736328125, -4.24395751953125, -4.0142822265625, -3.78460693359375, -3.554931640625, -3.32525634765625, -3.0955810546875, -2.86590576171875, -2.63623046875, -2.40655517578125, -2.1768798828125, -1.94720458984375, -1.717529296875, -1.48785400390625, -1.2581787109375, -1.02850341796875, -0.798828125, -0.56915283203125, -0.3394775390625, -0.10980224609375, 0.119873046875, 0.34954833984375, 0.5792236328125, 0.80889892578125, 1.03857421875, 1.26824951171875, 1.4979248046875, 1.72760009765625, 1.957275390625, 2.18695068359375, 2.4166259765625, 2.64630126953125, 2.8759765625, 3.10565185546875, 3.3353271484375, 3.56500244140625, 3.794677734375, 4.02435302734375, 4.2540283203125, 4.48370361328125, 4.71337890625, 4.94305419921875, 5.1727294921875, 5.40240478515625, 5.632080078125, 5.86175537109375, 6.0914306640625, 6.32110595703125, 6.55078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 8.0, 2.0, 6.0, 9.0, 8.0, 12.0, 10.0, 21.0, 16.0, 25.0, 26.0, 30.0, 46.0, 49.0, 40.0, 45.0, 39.0, 54.0, 65.0, 58.0, 48.0, 58.0, 39.0, 40.0, 43.0, 34.0, 29.0, 27.0, 23.0, 20.0, 21.0, 10.0, 11.0, 4.0, 9.0, 4.0, 4.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8671875, -12.5164794921875, -12.165771484375, -11.8150634765625, -11.46435546875, -11.1136474609375, -10.762939453125, -10.4122314453125, -10.0615234375, -9.7108154296875, -9.360107421875, -9.0093994140625, -8.65869140625, -8.3079833984375, -7.957275390625, -7.6065673828125, -7.255859375, -6.9051513671875, -6.554443359375, -6.2037353515625, -5.85302734375, -5.5023193359375, -5.151611328125, -4.8009033203125, -4.4501953125, -4.0994873046875, -3.748779296875, -3.3980712890625, -3.04736328125, -2.6966552734375, -2.345947265625, -1.9952392578125, -1.64453125, -1.2938232421875, -0.943115234375, -0.5924072265625, -0.24169921875, 0.1090087890625, 0.459716796875, 0.8104248046875, 1.1611328125, 1.5118408203125, 1.862548828125, 2.2132568359375, 2.56396484375, 2.9146728515625, 3.265380859375, 3.6160888671875, 3.966796875, 4.3175048828125, 4.668212890625, 5.0189208984375, 5.36962890625, 5.7203369140625, 6.071044921875, 6.4217529296875, 6.7724609375, 7.1231689453125, 7.473876953125, 7.8245849609375, 8.17529296875, 8.5260009765625, 8.876708984375, 9.2274169921875, 9.578125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 11.0, 13.0, 26.0, 53.0, 99.0, 265.0, 1144.0, 8659.0, 522429.0, 505412.0, 8798.0, 1120.0, 255.0, 113.0, 55.0, 25.0, 24.0, 13.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.1204833984375, -7.795654296875, -7.4708251953125, -7.14599609375, -6.8211669921875, -6.496337890625, -6.1715087890625, -5.8466796875, -5.5218505859375, -5.197021484375, -4.8721923828125, -4.54736328125, -4.2225341796875, -3.897705078125, -3.5728759765625, -3.248046875, -2.9232177734375, -2.598388671875, -2.2735595703125, -1.94873046875, -1.6239013671875, -1.299072265625, -0.9742431640625, -0.6494140625, -0.3245849609375, 0.000244140625, 0.3250732421875, 0.64990234375, 0.9747314453125, 1.299560546875, 1.6243896484375, 1.94921875, 2.2740478515625, 2.598876953125, 2.9237060546875, 3.24853515625, 3.5733642578125, 3.898193359375, 4.2230224609375, 4.5478515625, 4.8726806640625, 5.197509765625, 5.5223388671875, 5.84716796875, 6.1719970703125, 6.496826171875, 6.8216552734375, 7.146484375, 7.4713134765625, 7.796142578125, 8.1209716796875, 8.44580078125, 8.7706298828125, 9.095458984375, 9.4202880859375, 9.7451171875, 10.0699462890625, 10.394775390625, 10.7196044921875, 11.04443359375, 11.3692626953125, 11.694091796875, 12.0189208984375, 12.34375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 3.0, 13.0, 12.0, 19.0, 18.0, 21.0, 41.0, 43.0, 98.0, 131.0, 155.0, 119.0, 95.0, 50.0, 39.0, 27.0, 20.0, 13.0, 12.0, 8.0, 9.0, 8.0, 1.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000873565673828125, -0.0008465796709060669, -0.0008195936679840088, -0.0007926076650619507, -0.0007656216621398926, -0.0007386356592178345, -0.0007116496562957764, -0.0006846636533737183, -0.0006576776504516602, -0.000630691647529602, -0.0006037056446075439, -0.0005767196416854858, -0.0005497336387634277, -0.0005227476358413696, -0.0004957616329193115, -0.0004687756299972534, -0.0004417896270751953, -0.0004148036241531372, -0.0003878176212310791, -0.000360831618309021, -0.0003338456153869629, -0.0003068596124649048, -0.0002798736095428467, -0.0002528876066207886, -0.00022590160369873047, -0.00019891560077667236, -0.00017192959785461426, -0.00014494359493255615, -0.00011795759201049805, -9.097158908843994e-05, -6.398558616638184e-05, -3.699958324432373e-05, -1.0013580322265625e-05, 1.697242259979248e-05, 4.3958425521850586e-05, 7.094442844390869e-05, 9.79304313659668e-05, 0.0001249164342880249, 0.000151902437210083, 0.0001788884401321411, 0.00020587444305419922, 0.00023286044597625732, 0.00025984644889831543, 0.00028683245182037354, 0.00031381845474243164, 0.00034080445766448975, 0.00036779046058654785, 0.00039477646350860596, 0.00042176246643066406, 0.00044874846935272217, 0.0004757344722747803, 0.0005027204751968384, 0.0005297064781188965, 0.0005566924810409546, 0.0005836784839630127, 0.0006106644868850708, 0.0006376504898071289, 0.000664636492729187, 0.0006916224956512451, 0.0007186084985733032, 0.0007455945014953613, 0.0007725805044174194, 0.0007995665073394775, 0.0008265525102615356, 0.0008535385131835938]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 17.0, 30.0, 52.0, 70.0, 125.0, 231.0, 433.0, 907.0, 2209.0, 6781.0, 26643.0, 230834.0, 699129.0, 62921.0, 11831.0, 3600.0, 1321.0, 606.0, 321.0, 181.0, 79.0, 62.0, 45.0, 26.0, 15.0, 13.0, 14.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.82421875, -4.687286376953125, -4.55035400390625, -4.413421630859375, -4.2764892578125, -4.139556884765625, -4.00262451171875, -3.865692138671875, -3.728759765625, -3.591827392578125, -3.45489501953125, -3.317962646484375, -3.1810302734375, -3.044097900390625, -2.90716552734375, -2.770233154296875, -2.63330078125, -2.496368408203125, -2.35943603515625, -2.222503662109375, -2.0855712890625, -1.948638916015625, -1.81170654296875, -1.674774169921875, -1.537841796875, -1.400909423828125, -1.26397705078125, -1.127044677734375, -0.9901123046875, -0.853179931640625, -0.71624755859375, -0.579315185546875, -0.4423828125, -0.305450439453125, -0.16851806640625, -0.031585693359375, 0.1053466796875, 0.242279052734375, 0.37921142578125, 0.516143798828125, 0.653076171875, 0.790008544921875, 0.92694091796875, 1.063873291015625, 1.2008056640625, 1.337738037109375, 1.47467041015625, 1.611602783203125, 1.74853515625, 1.885467529296875, 2.02239990234375, 2.159332275390625, 2.2962646484375, 2.433197021484375, 2.57012939453125, 2.707061767578125, 2.843994140625, 2.980926513671875, 3.11785888671875, 3.254791259765625, 3.3917236328125, 3.528656005859375, 3.66558837890625, 3.802520751953125, 3.939453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 8.0, 6.0, 28.0, 32.0, 35.0, 71.0, 73.0, 114.0, 100.0, 95.0, 110.0, 89.0, 63.0, 50.0, 24.0, 21.0, 10.0, 14.0, 5.0, 10.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.650390625, -3.525726318359375, -3.40106201171875, -3.276397705078125, -3.1517333984375, -3.027069091796875, -2.90240478515625, -2.777740478515625, -2.653076171875, -2.528411865234375, -2.40374755859375, -2.279083251953125, -2.1544189453125, -2.029754638671875, -1.90509033203125, -1.780426025390625, -1.65576171875, -1.531097412109375, -1.40643310546875, -1.281768798828125, -1.1571044921875, -1.032440185546875, -0.90777587890625, -0.783111572265625, -0.658447265625, -0.533782958984375, -0.40911865234375, -0.284454345703125, -0.1597900390625, -0.035125732421875, 0.08953857421875, 0.214202880859375, 0.3388671875, 0.463531494140625, 0.58819580078125, 0.712860107421875, 0.8375244140625, 0.962188720703125, 1.08685302734375, 1.211517333984375, 1.336181640625, 1.460845947265625, 1.58551025390625, 1.710174560546875, 1.8348388671875, 1.959503173828125, 2.08416748046875, 2.208831787109375, 2.33349609375, 2.458160400390625, 2.58282470703125, 2.707489013671875, 2.8321533203125, 2.956817626953125, 3.08148193359375, 3.206146240234375, 3.330810546875, 3.455474853515625, 3.58013916015625, 3.704803466796875, 3.8294677734375, 3.954132080078125, 4.07879638671875, 4.203460693359375, 4.328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 9.0, 22.0, 142.0, 409.0, 296.0, 76.0, 21.0, 6.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.51541137695312, -136.9225616455078, -132.32972717285156, -127.73687744140625, -123.14402770996094, -118.55118560791016, -113.95834350585938, -109.36549377441406, -104.77264404296875, -100.17980194091797, -95.58695220947266, -90.99411010742188, -86.40126037597656, -81.80841827392578, -77.215576171875, -72.62272644042969, -68.0298843383789, -63.43703842163086, -58.84419250488281, -54.25135040283203, -49.65850067138672, -45.06565856933594, -40.47281265258789, -35.879966735839844, -31.287120819091797, -26.69427490234375, -22.101428985595703, -17.50858497619629, -12.915739059448242, -8.322893142700195, -3.7300491333007812, 0.8627967834472656, 5.4556427001953125, 10.04848861694336, 14.64133358001709, 19.23417854309082, 23.827024459838867, 28.419870376586914, 33.01271438598633, 37.605560302734375, 42.19840621948242, 46.79125213623047, 51.384098052978516, 55.97694396972656, 60.569786071777344, 65.16263580322266, 69.75547790527344, 74.34832763671875, 78.94116973876953, 83.53401184082031, 88.12686157226562, 92.7197036743164, 97.31255340576172, 101.9053955078125, 106.49824523925781, 111.0910873413086, 115.68392944335938, 120.27677154541016, 124.86962127685547, 129.46246337890625, 134.05531311035156, 138.64816284179688, 143.24099731445312, 147.83384704589844, 152.42669677734375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 5.0, 15.0, 22.0, 21.0, 15.0, 20.0, 36.0, 48.0, 50.0, 55.0, 58.0, 64.0, 84.0, 73.0, 73.0, 61.0, 65.0, 46.0, 33.0, 25.0, 26.0, 31.0, 17.0, 15.0, 11.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.01432800292969, -39.15485763549805, -37.295387268066406, -35.4359130859375, -33.57644271850586, -31.71697235107422, -29.857501983642578, -27.998031616210938, -26.138559341430664, -24.279088973999023, -22.41961669921875, -20.56014633178711, -18.70067596435547, -16.841203689575195, -14.981733322143555, -13.122262001037598, -11.26279067993164, -9.403319358825684, -7.543848514556885, -5.684377670288086, -3.824906349182129, -1.9654350280761719, -0.10596466064453125, 1.7535066604614258, 3.612977981567383, 5.47244930267334, 7.331920146942139, 9.191390991210938, 11.050862312316895, 12.910333633422852, 14.769804000854492, 16.629276275634766, 18.488746643066406, 20.348217010498047, 22.20768928527832, 24.06715965270996, 25.926631927490234, 27.786102294921875, 29.645572662353516, 31.505043029785156, 33.36451721191406, 35.2239875793457, 37.083457946777344, 38.94293212890625, 40.80240249633789, 42.66187286376953, 44.52134323120117, 46.38081359863281, 48.24028396606445, 50.099754333496094, 51.959224700927734, 53.818695068359375, 55.67816925048828, 57.53763961791992, 59.39710998535156, 61.2565803527832, 63.116050720214844, 64.97552490234375, 66.83499145507812, 68.69446563720703, 70.5539321899414, 72.41340637207031, 74.27287292480469, 76.1323471069336, 77.9918212890625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 11.0, 11.0, 11.0, 18.0, 42.0, 51.0, 89.0, 146.0, 241.0, 374.0, 727.0, 1500.0, 3123.0, 6987.0, 16712.0, 44951.0, 149081.0, 677814.0, 2072021.0, 935268.0, 197098.0, 53786.0, 19083.0, 7810.0, 3397.0, 1667.0, 960.0, 466.0, 284.0, 191.0, 120.0, 75.0, 45.0, 30.0, 26.0, 19.0, 15.0, 10.0, 2.0, 9.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.1015625, -3.014434814453125, -2.92730712890625, -2.840179443359375, -2.7530517578125, -2.665924072265625, -2.57879638671875, -2.491668701171875, -2.404541015625, -2.317413330078125, -2.23028564453125, -2.143157958984375, -2.0560302734375, -1.968902587890625, -1.88177490234375, -1.794647216796875, -1.70751953125, -1.620391845703125, -1.53326416015625, -1.446136474609375, -1.3590087890625, -1.271881103515625, -1.18475341796875, -1.097625732421875, -1.010498046875, -0.923370361328125, -0.83624267578125, -0.749114990234375, -0.6619873046875, -0.574859619140625, -0.48773193359375, -0.400604248046875, -0.3134765625, -0.226348876953125, -0.13922119140625, -0.052093505859375, 0.0350341796875, 0.122161865234375, 0.20928955078125, 0.296417236328125, 0.383544921875, 0.470672607421875, 0.55780029296875, 0.644927978515625, 0.7320556640625, 0.819183349609375, 0.90631103515625, 0.993438720703125, 1.08056640625, 1.167694091796875, 1.25482177734375, 1.341949462890625, 1.4290771484375, 1.516204833984375, 1.60333251953125, 1.690460205078125, 1.777587890625, 1.864715576171875, 1.95184326171875, 2.038970947265625, 2.1260986328125, 2.213226318359375, 2.30035400390625, 2.387481689453125, 2.474609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 14.0, 13.0, 21.0, 33.0, 40.0, 38.0, 56.0, 68.0, 57.0, 77.0, 76.0, 67.0, 82.0, 65.0, 53.0, 51.0, 37.0, 33.0, 30.0, 23.0, 18.0, 7.0, 6.0, 8.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -1.99786376953125, -1.8980712890625, -1.79827880859375, -1.698486328125, -1.59869384765625, -1.4989013671875, -1.39910888671875, -1.29931640625, -1.19952392578125, -1.0997314453125, -0.99993896484375, -0.900146484375, -0.80035400390625, -0.7005615234375, -0.60076904296875, -0.5009765625, -0.40118408203125, -0.3013916015625, -0.20159912109375, -0.101806640625, -0.00201416015625, 0.0977783203125, 0.19757080078125, 0.29736328125, 0.39715576171875, 0.4969482421875, 0.59674072265625, 0.696533203125, 0.79632568359375, 0.8961181640625, 0.99591064453125, 1.095703125, 1.19549560546875, 1.2952880859375, 1.39508056640625, 1.494873046875, 1.59466552734375, 1.6944580078125, 1.79425048828125, 1.89404296875, 1.99383544921875, 2.0936279296875, 2.19342041015625, 2.293212890625, 2.39300537109375, 2.4927978515625, 2.59259033203125, 2.6923828125, 2.79217529296875, 2.8919677734375, 2.99176025390625, 3.091552734375, 3.19134521484375, 3.2911376953125, 3.39093017578125, 3.49072265625, 3.59051513671875, 3.6903076171875, 3.79010009765625, 3.889892578125, 3.98968505859375, 4.0894775390625, 4.18927001953125, 4.2890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 5.0, 15.0, 12.0, 29.0, 26.0, 42.0, 53.0, 70.0, 97.0, 178.0, 296.0, 548.0, 1023.0, 2270.0, 5640.0, 15097.0, 47285.0, 193140.0, 1309099.0, 2186880.0, 329235.0, 69790.0, 20609.0, 7257.0, 2847.0, 1262.0, 616.0, 311.0, 172.0, 133.0, 65.0, 55.0, 40.0, 27.0, 22.0, 11.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.470672607421875, -4.33978271484375, -4.208892822265625, -4.0780029296875, -3.947113037109375, -3.81622314453125, -3.685333251953125, -3.554443359375, -3.423553466796875, -3.29266357421875, -3.161773681640625, -3.0308837890625, -2.899993896484375, -2.76910400390625, -2.638214111328125, -2.50732421875, -2.376434326171875, -2.24554443359375, -2.114654541015625, -1.9837646484375, -1.852874755859375, -1.72198486328125, -1.591094970703125, -1.460205078125, -1.329315185546875, -1.19842529296875, -1.067535400390625, -0.9366455078125, -0.805755615234375, -0.67486572265625, -0.543975830078125, -0.4130859375, -0.282196044921875, -0.15130615234375, -0.020416259765625, 0.1104736328125, 0.241363525390625, 0.37225341796875, 0.503143310546875, 0.634033203125, 0.764923095703125, 0.89581298828125, 1.026702880859375, 1.1575927734375, 1.288482666015625, 1.41937255859375, 1.550262451171875, 1.68115234375, 1.812042236328125, 1.94293212890625, 2.073822021484375, 2.2047119140625, 2.335601806640625, 2.46649169921875, 2.597381591796875, 2.728271484375, 2.859161376953125, 2.99005126953125, 3.120941162109375, 3.2518310546875, 3.382720947265625, 3.51361083984375, 3.644500732421875, 3.775390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 5.0, 6.0, 5.0, 10.0, 16.0, 15.0, 25.0, 16.0, 27.0, 42.0, 57.0, 77.0, 86.0, 113.0, 173.0, 207.0, 292.0, 371.0, 435.0, 457.0, 382.0, 291.0, 242.0, 158.0, 114.0, 111.0, 71.0, 54.0, 51.0, 42.0, 25.0, 17.0, 14.0, 7.0, 10.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.53515625, -4.39373779296875, -4.2523193359375, -4.11090087890625, -3.969482421875, -3.82806396484375, -3.6866455078125, -3.54522705078125, -3.40380859375, -3.26239013671875, -3.1209716796875, -2.97955322265625, -2.838134765625, -2.69671630859375, -2.5552978515625, -2.41387939453125, -2.2724609375, -2.13104248046875, -1.9896240234375, -1.84820556640625, -1.706787109375, -1.56536865234375, -1.4239501953125, -1.28253173828125, -1.14111328125, -0.99969482421875, -0.8582763671875, -0.71685791015625, -0.575439453125, -0.43402099609375, -0.2926025390625, -0.15118408203125, -0.009765625, 0.13165283203125, 0.2730712890625, 0.41448974609375, 0.555908203125, 0.69732666015625, 0.8387451171875, 0.98016357421875, 1.12158203125, 1.26300048828125, 1.4044189453125, 1.54583740234375, 1.687255859375, 1.82867431640625, 1.9700927734375, 2.11151123046875, 2.2529296875, 2.39434814453125, 2.5357666015625, 2.67718505859375, 2.818603515625, 2.96002197265625, 3.1014404296875, 3.24285888671875, 3.38427734375, 3.52569580078125, 3.6671142578125, 3.80853271484375, 3.949951171875, 4.09136962890625, 4.2327880859375, 4.37420654296875, 4.515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 32.0, 116.0, 233.0, 294.0, 185.0, 74.0, 26.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.46976852416992, -52.22914505004883, -48.988525390625, -45.747901916503906, -42.50727844238281, -39.26665496826172, -36.02603530883789, -32.7854118347168, -29.544790267944336, -26.304168701171875, -23.06354522705078, -19.82292366027832, -16.58230209350586, -13.341678619384766, -10.101057052612305, -6.860433578491211, -3.61981201171875, -0.37918972969055176, 2.8614325523376465, 6.102054595947266, 9.342677116394043, 12.58329963684082, 15.823921203613281, 19.064544677734375, 22.305166244506836, 25.545787811279297, 28.78641128540039, 32.02703094482422, 35.26765441894531, 38.508277893066406, 41.7489013671875, 44.989524841308594, 48.230140686035156, 51.47076416015625, 54.71138381958008, 57.95200729370117, 61.192630767822266, 64.4332504272461, 67.67387390136719, 70.91449737548828, 74.15512084960938, 77.39574432373047, 80.63636779785156, 83.87698364257812, 87.11760711669922, 90.35823059082031, 93.5988540649414, 96.8394775390625, 100.08009338378906, 103.32071685791016, 106.56134033203125, 109.80195617675781, 113.0425796508789, 116.283203125, 119.5238265991211, 122.76445007324219, 126.00507354736328, 129.24569702148438, 132.48631286621094, 135.72694396972656, 138.96755981445312, 142.20819091796875, 145.4488067626953, 148.68942260742188, 151.9300537109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 1.0, 8.0, 11.0, 15.0, 14.0, 16.0, 27.0, 24.0, 38.0, 33.0, 43.0, 36.0, 57.0, 41.0, 50.0, 60.0, 51.0, 51.0, 57.0, 45.0, 42.0, 44.0, 39.0, 31.0, 30.0, 33.0, 27.0, 13.0, 20.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.03376007080078, -41.823997497558594, -40.614234924316406, -39.40447235107422, -38.19470977783203, -36.984947204589844, -35.775184631347656, -34.56542205810547, -33.35565948486328, -32.145896911621094, -30.936134338378906, -29.72637176513672, -28.51660919189453, -27.306846618652344, -26.097084045410156, -24.88732147216797, -23.67755889892578, -22.467796325683594, -21.258033752441406, -20.04827117919922, -18.83850860595703, -17.628746032714844, -16.418983459472656, -15.209220886230469, -13.999458312988281, -12.789695739746094, -11.579933166503906, -10.370170593261719, -9.160408020019531, -7.950645446777344, -6.740882873535156, -5.531120300292969, -4.321357727050781, -3.1115951538085938, -1.9018325805664062, -0.6920700073242188, 0.5176925659179688, 1.7274551391601562, 2.9372177124023438, 4.146980285644531, 5.356742858886719, 6.566505432128906, 7.776268005371094, 8.986030578613281, 10.195793151855469, 11.405555725097656, 12.615318298339844, 13.825080871582031, 15.034843444824219, 16.244606018066406, 17.454368591308594, 18.66413116455078, 19.87389373779297, 21.083656311035156, 22.293418884277344, 23.50318145751953, 24.71294403076172, 25.922706604003906, 27.132469177246094, 28.34223175048828, 29.55199432373047, 30.761756896972656, 31.971519470214844, 33.18128204345703, 34.39104461669922]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 8.0, 9.0, 12.0, 14.0, 13.0, 23.0, 34.0, 53.0, 81.0, 140.0, 217.0, 290.0, 548.0, 990.0, 1801.0, 3257.0, 6419.0, 12933.0, 27051.0, 59208.0, 144324.0, 348216.0, 260417.0, 98839.0, 43022.0, 20252.0, 9670.0, 4811.0, 2526.0, 1372.0, 719.0, 455.0, 273.0, 198.0, 117.0, 68.0, 56.0, 40.0, 20.0, 19.0, 12.0, 10.0, 5.0, 5.0, 8.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.19921875, -4.074981689453125, -3.95074462890625, -3.826507568359375, -3.7022705078125, -3.578033447265625, -3.45379638671875, -3.329559326171875, -3.205322265625, -3.081085205078125, -2.95684814453125, -2.832611083984375, -2.7083740234375, -2.584136962890625, -2.45989990234375, -2.335662841796875, -2.21142578125, -2.087188720703125, -1.96295166015625, -1.838714599609375, -1.7144775390625, -1.590240478515625, -1.46600341796875, -1.341766357421875, -1.217529296875, -1.093292236328125, -0.96905517578125, -0.844818115234375, -0.7205810546875, -0.596343994140625, -0.47210693359375, -0.347869873046875, -0.2236328125, -0.099395751953125, 0.02484130859375, 0.149078369140625, 0.2733154296875, 0.397552490234375, 0.52178955078125, 0.646026611328125, 0.770263671875, 0.894500732421875, 1.01873779296875, 1.142974853515625, 1.2672119140625, 1.391448974609375, 1.51568603515625, 1.639923095703125, 1.76416015625, 1.888397216796875, 2.01263427734375, 2.136871337890625, 2.2611083984375, 2.385345458984375, 2.50958251953125, 2.633819580078125, 2.758056640625, 2.882293701171875, 3.00653076171875, 3.130767822265625, 3.2550048828125, 3.379241943359375, 3.50347900390625, 3.627716064453125, 3.751953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 14.0, 16.0, 15.0, 14.0, 30.0, 20.0, 24.0, 31.0, 31.0, 38.0, 52.0, 46.0, 53.0, 43.0, 60.0, 46.0, 39.0, 56.0, 41.0, 33.0, 30.0, 38.0, 42.0, 30.0, 28.0, 16.0, 15.0, 15.0, 9.0, 11.0, 16.0, 6.0, 2.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.07421875, -2.004913330078125, -1.93560791015625, -1.866302490234375, -1.7969970703125, -1.727691650390625, -1.65838623046875, -1.589080810546875, -1.519775390625, -1.450469970703125, -1.38116455078125, -1.311859130859375, -1.2425537109375, -1.173248291015625, -1.10394287109375, -1.034637451171875, -0.96533203125, -0.896026611328125, -0.82672119140625, -0.757415771484375, -0.6881103515625, -0.618804931640625, -0.54949951171875, -0.480194091796875, -0.410888671875, -0.341583251953125, -0.27227783203125, -0.202972412109375, -0.1336669921875, -0.064361572265625, 0.00494384765625, 0.074249267578125, 0.1435546875, 0.212860107421875, 0.28216552734375, 0.351470947265625, 0.4207763671875, 0.490081787109375, 0.55938720703125, 0.628692626953125, 0.697998046875, 0.767303466796875, 0.83660888671875, 0.905914306640625, 0.9752197265625, 1.044525146484375, 1.11383056640625, 1.183135986328125, 1.25244140625, 1.321746826171875, 1.39105224609375, 1.460357666015625, 1.5296630859375, 1.598968505859375, 1.66827392578125, 1.737579345703125, 1.806884765625, 1.876190185546875, 1.94549560546875, 2.014801025390625, 2.0841064453125, 2.153411865234375, 2.22271728515625, 2.292022705078125, 2.361328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 15.0, 15.0, 16.0, 31.0, 44.0, 55.0, 92.0, 97.0, 150.0, 233.0, 347.0, 547.0, 918.0, 1732.0, 3254.0, 8093.0, 31733.0, 243480.0, 674348.0, 61136.0, 12507.0, 4479.0, 2066.0, 1120.0, 689.0, 419.0, 318.0, 188.0, 124.0, 102.0, 57.0, 42.0, 27.0, 21.0, 14.0, 15.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-10.6171875, -10.2972412109375, -9.977294921875, -9.6573486328125, -9.33740234375, -9.0174560546875, -8.697509765625, -8.3775634765625, -8.0576171875, -7.7376708984375, -7.417724609375, -7.0977783203125, -6.77783203125, -6.4578857421875, -6.137939453125, -5.8179931640625, -5.498046875, -5.1781005859375, -4.858154296875, -4.5382080078125, -4.21826171875, -3.8983154296875, -3.578369140625, -3.2584228515625, -2.9384765625, -2.6185302734375, -2.298583984375, -1.9786376953125, -1.65869140625, -1.3387451171875, -1.018798828125, -0.6988525390625, -0.37890625, -0.0589599609375, 0.260986328125, 0.5809326171875, 0.90087890625, 1.2208251953125, 1.540771484375, 1.8607177734375, 2.1806640625, 2.5006103515625, 2.820556640625, 3.1405029296875, 3.46044921875, 3.7803955078125, 4.100341796875, 4.4202880859375, 4.740234375, 5.0601806640625, 5.380126953125, 5.7000732421875, 6.02001953125, 6.3399658203125, 6.659912109375, 6.9798583984375, 7.2998046875, 7.6197509765625, 7.939697265625, 8.2596435546875, 8.57958984375, 8.8995361328125, 9.219482421875, 9.5394287109375, 9.859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 12.0, 15.0, 10.0, 15.0, 29.0, 20.0, 30.0, 23.0, 35.0, 38.0, 51.0, 73.0, 56.0, 56.0, 56.0, 54.0, 50.0, 51.0, 49.0, 44.0, 42.0, 33.0, 31.0, 24.0, 16.0, 18.0, 14.0, 13.0, 12.0, 3.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.4239501953125, -12.011962890625, -11.5999755859375, -11.18798828125, -10.7760009765625, -10.364013671875, -9.9520263671875, -9.5400390625, -9.1280517578125, -8.716064453125, -8.3040771484375, -7.89208984375, -7.4801025390625, -7.068115234375, -6.6561279296875, -6.244140625, -5.8321533203125, -5.420166015625, -5.0081787109375, -4.59619140625, -4.1842041015625, -3.772216796875, -3.3602294921875, -2.9482421875, -2.5362548828125, -2.124267578125, -1.7122802734375, -1.30029296875, -0.8883056640625, -0.476318359375, -0.0643310546875, 0.34765625, 0.7596435546875, 1.171630859375, 1.5836181640625, 1.99560546875, 2.4075927734375, 2.819580078125, 3.2315673828125, 3.6435546875, 4.0555419921875, 4.467529296875, 4.8795166015625, 5.29150390625, 5.7034912109375, 6.115478515625, 6.5274658203125, 6.939453125, 7.3514404296875, 7.763427734375, 8.1754150390625, 8.58740234375, 8.9993896484375, 9.411376953125, 9.8233642578125, 10.2353515625, 10.6473388671875, 11.059326171875, 11.4713134765625, 11.88330078125, 12.2952880859375, 12.707275390625, 13.1192626953125, 13.53125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 10.0, 15.0, 17.0, 18.0, 29.0, 30.0, 54.0, 91.0, 126.0, 214.0, 373.0, 741.0, 1648.0, 4291.0, 14631.0, 62490.0, 514413.0, 370240.0, 57878.0, 13753.0, 4224.0, 1585.0, 745.0, 369.0, 191.0, 128.0, 55.0, 50.0, 42.0, 30.0, 14.0, 10.0, 12.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.14453125, -4.029327392578125, -3.91412353515625, -3.798919677734375, -3.6837158203125, -3.568511962890625, -3.45330810546875, -3.338104248046875, -3.222900390625, -3.107696533203125, -2.99249267578125, -2.877288818359375, -2.7620849609375, -2.646881103515625, -2.53167724609375, -2.416473388671875, -2.30126953125, -2.186065673828125, -2.07086181640625, -1.955657958984375, -1.8404541015625, -1.725250244140625, -1.61004638671875, -1.494842529296875, -1.379638671875, -1.264434814453125, -1.14923095703125, -1.034027099609375, -0.9188232421875, -0.803619384765625, -0.68841552734375, -0.573211669921875, -0.4580078125, -0.342803955078125, -0.22760009765625, -0.112396240234375, 0.0028076171875, 0.118011474609375, 0.23321533203125, 0.348419189453125, 0.463623046875, 0.578826904296875, 0.69403076171875, 0.809234619140625, 0.9244384765625, 1.039642333984375, 1.15484619140625, 1.270050048828125, 1.38525390625, 1.500457763671875, 1.61566162109375, 1.730865478515625, 1.8460693359375, 1.961273193359375, 2.07647705078125, 2.191680908203125, 2.306884765625, 2.422088623046875, 2.53729248046875, 2.652496337890625, 2.7677001953125, 2.882904052734375, 2.99810791015625, 3.113311767578125, 3.228515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 6.0, 8.0, 9.0, 13.0, 22.0, 20.0, 22.0, 23.0, 48.0, 33.0, 52.0, 92.0, 153.0, 107.0, 79.0, 50.0, 52.0, 30.0, 28.0, 26.0, 20.0, 19.0, 17.0, 8.0, 9.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008449554443359375, -0.0008155107498168945, -0.0007860660552978516, -0.0007566213607788086, -0.0007271766662597656, -0.0006977319717407227, -0.0006682872772216797, -0.0006388425827026367, -0.0006093978881835938, -0.0005799531936645508, -0.0005505084991455078, -0.0005210638046264648, -0.0004916191101074219, -0.0004621744155883789, -0.00043272972106933594, -0.00040328502655029297, -0.00037384033203125, -0.00034439563751220703, -0.00031495094299316406, -0.0002855062484741211, -0.0002560615539550781, -0.00022661685943603516, -0.0001971721649169922, -0.00016772747039794922, -0.00013828277587890625, -0.00010883808135986328, -7.939338684082031e-05, -4.9948692321777344e-05, -2.0503997802734375e-05, 8.940696716308594e-06, 3.838539123535156e-05, 6.783008575439453e-05, 9.72747802734375e-05, 0.00012671947479248047, 0.00015616416931152344, 0.0001856088638305664, 0.00021505355834960938, 0.00024449825286865234, 0.0002739429473876953, 0.0003033876419067383, 0.00033283233642578125, 0.0003622770309448242, 0.0003917217254638672, 0.00042116641998291016, 0.0004506111145019531, 0.0004800558090209961, 0.0005095005035400391, 0.000538945198059082, 0.000568389892578125, 0.000597834587097168, 0.0006272792816162109, 0.0006567239761352539, 0.0006861686706542969, 0.0007156133651733398, 0.0007450580596923828, 0.0007745027542114258, 0.0008039474487304688, 0.0008333921432495117, 0.0008628368377685547, 0.0008922815322875977, 0.0009217262268066406, 0.0009511709213256836, 0.0009806156158447266, 0.0010100603103637695, 0.0010395050048828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 12.0, 12.0, 12.0, 22.0, 39.0, 59.0, 60.0, 88.0, 126.0, 214.0, 346.0, 535.0, 874.0, 1622.0, 2954.0, 6235.0, 16333.0, 59606.0, 337268.0, 520095.0, 69091.0, 18665.0, 6899.0, 3095.0, 1710.0, 949.0, 546.0, 359.0, 237.0, 132.0, 97.0, 62.0, 49.0, 35.0, 33.0, 19.0, 14.0, 10.0, 10.0, 3.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-3.52734375, -3.42950439453125, -3.3316650390625, -3.23382568359375, -3.135986328125, -3.03814697265625, -2.9403076171875, -2.84246826171875, -2.74462890625, -2.64678955078125, -2.5489501953125, -2.45111083984375, -2.353271484375, -2.25543212890625, -2.1575927734375, -2.05975341796875, -1.9619140625, -1.86407470703125, -1.7662353515625, -1.66839599609375, -1.570556640625, -1.47271728515625, -1.3748779296875, -1.27703857421875, -1.17919921875, -1.08135986328125, -0.9835205078125, -0.88568115234375, -0.787841796875, -0.69000244140625, -0.5921630859375, -0.49432373046875, -0.396484375, -0.29864501953125, -0.2008056640625, -0.10296630859375, -0.005126953125, 0.09271240234375, 0.1905517578125, 0.28839111328125, 0.38623046875, 0.48406982421875, 0.5819091796875, 0.67974853515625, 0.777587890625, 0.87542724609375, 0.9732666015625, 1.07110595703125, 1.1689453125, 1.26678466796875, 1.3646240234375, 1.46246337890625, 1.560302734375, 1.65814208984375, 1.7559814453125, 1.85382080078125, 1.95166015625, 2.04949951171875, 2.1473388671875, 2.24517822265625, 2.343017578125, 2.44085693359375, 2.5386962890625, 2.63653564453125, 2.734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 1.0, 3.0, 12.0, 10.0, 14.0, 30.0, 34.0, 18.0, 29.0, 55.0, 53.0, 80.0, 104.0, 110.0, 112.0, 70.0, 55.0, 39.0, 29.0, 33.0, 24.0, 18.0, 13.0, 15.0, 8.0, 9.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.71484375, -3.600250244140625, -3.48565673828125, -3.371063232421875, -3.2564697265625, -3.141876220703125, -3.02728271484375, -2.912689208984375, -2.798095703125, -2.683502197265625, -2.56890869140625, -2.454315185546875, -2.3397216796875, -2.225128173828125, -2.11053466796875, -1.995941162109375, -1.88134765625, -1.766754150390625, -1.65216064453125, -1.537567138671875, -1.4229736328125, -1.308380126953125, -1.19378662109375, -1.079193115234375, -0.964599609375, -0.850006103515625, -0.73541259765625, -0.620819091796875, -0.5062255859375, -0.391632080078125, -0.27703857421875, -0.162445068359375, -0.0478515625, 0.066741943359375, 0.18133544921875, 0.295928955078125, 0.4105224609375, 0.525115966796875, 0.63970947265625, 0.754302978515625, 0.868896484375, 0.983489990234375, 1.09808349609375, 1.212677001953125, 1.3272705078125, 1.441864013671875, 1.55645751953125, 1.671051025390625, 1.78564453125, 1.900238037109375, 2.01483154296875, 2.129425048828125, 2.2440185546875, 2.358612060546875, 2.47320556640625, 2.587799072265625, 2.702392578125, 2.816986083984375, 2.93157958984375, 3.046173095703125, 3.1607666015625, 3.275360107421875, 3.38995361328125, 3.504547119140625, 3.619140625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 11.0, 16.0, 40.0, 110.0, 183.0, 276.0, 172.0, 90.0, 39.0, 24.0, 13.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.4699935913086, -74.7429428100586, -72.01588439941406, -69.28883361816406, -66.56177520751953, -63.83472442626953, -61.107669830322266, -58.380615234375, -55.653564453125, -52.926509857177734, -50.19945526123047, -47.47240447998047, -44.7453498840332, -42.01829528808594, -39.29124069213867, -36.564186096191406, -33.83713150024414, -31.110076904296875, -28.383024215698242, -25.655969619750977, -22.928916931152344, -20.201862335205078, -17.474807739257812, -14.74775505065918, -12.020700454711914, -9.293646812438965, -6.566592693328857, -3.83953857421875, -1.1124849319458008, 1.6145687103271484, 4.341623306274414, 7.068675994873047, 9.795730590820312, 12.522784233093262, 15.249837875366211, 17.976892471313477, 20.70394515991211, 23.430999755859375, 26.15805435180664, 28.885107040405273, 31.61216163635254, 34.33921432495117, 37.06626892089844, 39.7933235168457, 42.52037811279297, 45.24742889404297, 47.9744873046875, 50.7015380859375, 53.428592681884766, 56.15564727783203, 58.8827018737793, 61.60975646972656, 64.33680725097656, 67.06385803222656, 69.7909164428711, 72.5179672241211, 75.24502563476562, 77.97207641601562, 80.69913482666016, 83.42618560791016, 86.15324401855469, 88.88029479980469, 91.60734558105469, 94.33440399169922, 97.06145477294922]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 8.0, 12.0, 8.0, 14.0, 16.0, 13.0, 13.0, 16.0, 28.0, 26.0, 28.0, 31.0, 30.0, 32.0, 39.0, 49.0, 42.0, 53.0, 59.0, 58.0, 44.0, 38.0, 39.0, 36.0, 22.0, 26.0, 27.0, 26.0, 15.0, 17.0, 24.0, 15.0, 17.0, 11.0, 15.0, 9.0, 8.0, 8.0, 0.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-33.903533935546875, -32.78506088256836, -31.66658592224121, -30.548110961914062, -29.429637908935547, -28.3111629486084, -27.19268798828125, -26.074214935302734, -24.955739974975586, -23.837265014648438, -22.718791961669922, -21.600317001342773, -20.481842041015625, -19.36336898803711, -18.24489402770996, -17.126419067382812, -16.007946014404297, -14.889472007751465, -13.770998001098633, -12.652523040771484, -11.534049034118652, -10.41557502746582, -9.297100067138672, -8.17862606048584, -7.060152053833008, -5.941678047180176, -4.8232035636901855, -3.7047293186187744, -2.5862550735473633, -1.4677810668945312, -0.349306583404541, 0.7691679000854492, 1.8876457214355469, 3.006119966506958, 4.124594211578369, 5.243068695068359, 6.361542701721191, 7.480016708374023, 8.598491668701172, 9.716965675354004, 10.835439682006836, 11.953913688659668, 13.0723876953125, 14.190862655639648, 15.30933666229248, 16.427810668945312, 17.54628562927246, 18.66476058959961, 19.783233642578125, 20.901708602905273, 22.02018165588379, 23.138656616210938, 24.257129669189453, 25.3756046295166, 26.49407958984375, 27.612552642822266, 28.731027603149414, 29.849502563476562, 30.967975616455078, 32.086448669433594, 33.204925537109375, 34.32339859008789, 35.441871643066406, 36.56034851074219, 37.6788215637207]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 9.0, 8.0, 10.0, 18.0, 25.0, 35.0, 37.0, 66.0, 142.0, 212.0, 394.0, 940.0, 2310.0, 7304.0, 31381.0, 222717.0, 2568015.0, 1234930.0, 99976.0, 17986.0, 4668.0, 1603.0, 732.0, 305.0, 151.0, 103.0, 61.0, 42.0, 26.0, 21.0, 14.0, 14.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.21484375, -5.0650634765625, -4.915283203125, -4.7655029296875, -4.61572265625, -4.4659423828125, -4.316162109375, -4.1663818359375, -4.0166015625, -3.8668212890625, -3.717041015625, -3.5672607421875, -3.41748046875, -3.2677001953125, -3.117919921875, -2.9681396484375, -2.818359375, -2.6685791015625, -2.518798828125, -2.3690185546875, -2.21923828125, -2.0694580078125, -1.919677734375, -1.7698974609375, -1.6201171875, -1.4703369140625, -1.320556640625, -1.1707763671875, -1.02099609375, -0.8712158203125, -0.721435546875, -0.5716552734375, -0.421875, -0.2720947265625, -0.122314453125, 0.0274658203125, 0.17724609375, 0.3270263671875, 0.476806640625, 0.6265869140625, 0.7763671875, 0.9261474609375, 1.075927734375, 1.2257080078125, 1.37548828125, 1.5252685546875, 1.675048828125, 1.8248291015625, 1.974609375, 2.1243896484375, 2.274169921875, 2.4239501953125, 2.57373046875, 2.7235107421875, 2.873291015625, 3.0230712890625, 3.1728515625, 3.3226318359375, 3.472412109375, 3.6221923828125, 3.77197265625, 3.9217529296875, 4.071533203125, 4.2213134765625, 4.37109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 13.0, 8.0, 19.0, 19.0, 35.0, 35.0, 17.0, 36.0, 40.0, 43.0, 45.0, 69.0, 58.0, 51.0, 54.0, 43.0, 57.0, 49.0, 53.0, 55.0, 36.0, 22.0, 28.0, 17.0, 18.0, 15.0, 20.0, 4.0, 11.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.376953125, -2.29669189453125, -2.2164306640625, -2.13616943359375, -2.055908203125, -1.97564697265625, -1.8953857421875, -1.81512451171875, -1.73486328125, -1.65460205078125, -1.5743408203125, -1.49407958984375, -1.413818359375, -1.33355712890625, -1.2532958984375, -1.17303466796875, -1.0927734375, -1.01251220703125, -0.9322509765625, -0.85198974609375, -0.771728515625, -0.69146728515625, -0.6112060546875, -0.53094482421875, -0.45068359375, -0.37042236328125, -0.2901611328125, -0.20989990234375, -0.129638671875, -0.04937744140625, 0.0308837890625, 0.11114501953125, 0.19140625, 0.27166748046875, 0.3519287109375, 0.43218994140625, 0.512451171875, 0.59271240234375, 0.6729736328125, 0.75323486328125, 0.83349609375, 0.91375732421875, 0.9940185546875, 1.07427978515625, 1.154541015625, 1.23480224609375, 1.3150634765625, 1.39532470703125, 1.4755859375, 1.55584716796875, 1.6361083984375, 1.71636962890625, 1.796630859375, 1.87689208984375, 1.9571533203125, 2.03741455078125, 2.11767578125, 2.19793701171875, 2.2781982421875, 2.35845947265625, 2.438720703125, 2.51898193359375, 2.5992431640625, 2.67950439453125, 2.759765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 17.0, 17.0, 36.0, 41.0, 59.0, 93.0, 147.0, 195.0, 332.0, 501.0, 874.0, 1624.0, 3498.0, 9568.0, 30755.0, 131816.0, 1080732.0, 2539819.0, 316964.0, 53803.0, 14106.0, 4801.0, 2015.0, 992.0, 562.0, 324.0, 184.0, 136.0, 79.0, 51.0, 41.0, 20.0, 19.0, 13.0, 4.0, 3.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.50341796875, -4.3544921875, -4.20556640625, -4.056640625, -3.90771484375, -3.7587890625, -3.60986328125, -3.4609375, -3.31201171875, -3.1630859375, -3.01416015625, -2.865234375, -2.71630859375, -2.5673828125, -2.41845703125, -2.26953125, -2.12060546875, -1.9716796875, -1.82275390625, -1.673828125, -1.52490234375, -1.3759765625, -1.22705078125, -1.078125, -0.92919921875, -0.7802734375, -0.63134765625, -0.482421875, -0.33349609375, -0.1845703125, -0.03564453125, 0.11328125, 0.26220703125, 0.4111328125, 0.56005859375, 0.708984375, 0.85791015625, 1.0068359375, 1.15576171875, 1.3046875, 1.45361328125, 1.6025390625, 1.75146484375, 1.900390625, 2.04931640625, 2.1982421875, 2.34716796875, 2.49609375, 2.64501953125, 2.7939453125, 2.94287109375, 3.091796875, 3.24072265625, 3.3896484375, 3.53857421875, 3.6875, 3.83642578125, 3.9853515625, 4.13427734375, 4.283203125, 4.43212890625, 4.5810546875, 4.72998046875, 4.87890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 7.0, 9.0, 14.0, 33.0, 34.0, 53.0, 66.0, 111.0, 201.0, 304.0, 500.0, 689.0, 703.0, 530.0, 307.0, 190.0, 116.0, 72.0, 48.0, 20.0, 18.0, 15.0, 12.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.04400634765625, -7.8145751953125, -7.58514404296875, -7.355712890625, -7.12628173828125, -6.8968505859375, -6.66741943359375, -6.43798828125, -6.20855712890625, -5.9791259765625, -5.74969482421875, -5.520263671875, -5.29083251953125, -5.0614013671875, -4.83197021484375, -4.6025390625, -4.37310791015625, -4.1436767578125, -3.91424560546875, -3.684814453125, -3.45538330078125, -3.2259521484375, -2.99652099609375, -2.76708984375, -2.53765869140625, -2.3082275390625, -2.07879638671875, -1.849365234375, -1.61993408203125, -1.3905029296875, -1.16107177734375, -0.931640625, -0.70220947265625, -0.4727783203125, -0.24334716796875, -0.013916015625, 0.21551513671875, 0.4449462890625, 0.67437744140625, 0.90380859375, 1.13323974609375, 1.3626708984375, 1.59210205078125, 1.821533203125, 2.05096435546875, 2.2803955078125, 2.50982666015625, 2.7392578125, 2.96868896484375, 3.1981201171875, 3.42755126953125, 3.656982421875, 3.88641357421875, 4.1158447265625, 4.34527587890625, 4.57470703125, 4.80413818359375, 5.0335693359375, 5.26300048828125, 5.492431640625, 5.72186279296875, 5.9512939453125, 6.18072509765625, 6.41015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 3.0, 4.0, 10.0, 25.0, 70.0, 216.0, 337.0, 237.0, 65.0, 23.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.3163070678711, -115.5395278930664, -111.76274871826172, -107.98596954345703, -104.20919036865234, -100.43241119384766, -96.6556396484375, -92.87886047363281, -89.10208129882812, -85.32530212402344, -81.54852294921875, -77.77174377441406, -73.99496459960938, -70.21818542480469, -66.44140625, -62.66463088989258, -58.887847900390625, -55.11106872558594, -51.33428955078125, -47.55751037597656, -43.780731201171875, -40.00395202636719, -36.227176666259766, -32.45039749145508, -28.67361831665039, -24.896839141845703, -21.120059967041016, -17.34328269958496, -13.566503524780273, -9.789724349975586, -6.012947082519531, -2.2361679077148438, 1.5406036376953125, 5.317382335662842, 9.094161033630371, 12.870939254760742, 16.64771842956543, 20.424497604370117, 24.201274871826172, 27.97805404663086, 31.754833221435547, 35.531612396240234, 39.30839157104492, 43.085166931152344, 46.86194610595703, 50.63872528076172, 54.415504455566406, 58.192283630371094, 61.96906280517578, 65.74584197998047, 69.52262115478516, 73.29940032958984, 77.07617950439453, 80.85295867919922, 84.62973022460938, 88.40650939941406, 92.18328857421875, 95.96006774902344, 99.73684692382812, 103.51362609863281, 107.2904052734375, 111.06718444824219, 114.84396362304688, 118.62074279785156, 122.39752197265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 14.0, 8.0, 7.0, 11.0, 18.0, 22.0, 22.0, 33.0, 31.0, 32.0, 25.0, 36.0, 38.0, 41.0, 42.0, 38.0, 65.0, 55.0, 33.0, 54.0, 44.0, 50.0, 39.0, 35.0, 37.0, 34.0, 24.0, 25.0, 12.0, 11.0, 6.0, 9.0, 8.0, 4.0, 7.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-32.31354904174805, -31.44346809387207, -30.57338523864746, -29.703304290771484, -28.833221435546875, -27.9631404876709, -27.09305763244629, -26.222976684570312, -25.352893829345703, -24.482812881469727, -23.612730026245117, -22.74264907836914, -21.87256622314453, -21.002485275268555, -20.132402420043945, -19.26232147216797, -18.39223861694336, -17.522157669067383, -16.652074813842773, -15.78199291229248, -14.911911010742188, -14.041830062866211, -13.171747207641602, -12.301666259765625, -11.431585311889648, -10.561503410339355, -9.691421508789062, -8.82133960723877, -7.951257705688477, -7.081176280975342, -6.211094379425049, -5.341012477874756, -4.470930099487305, -3.6008481979370117, -2.7307662963867188, -1.8606846332550049, -0.9906027317047119, -0.12052106857299805, 0.7495608329772949, 1.619642734527588, 2.489724636077881, 3.359806537628174, 4.229888439178467, 5.099969863891602, 5.9700517654418945, 6.8401336669921875, 7.7102155685424805, 8.580297470092773, 9.450379371643066, 10.32046127319336, 11.190543174743652, 12.060625076293945, 12.930706977844238, 13.800788879394531, 14.670869827270508, 15.540952682495117, 16.411033630371094, 17.28111457824707, 18.15119743347168, 19.021278381347656, 19.891361236572266, 20.761442184448242, 21.63152503967285, 22.501605987548828, 23.371688842773438]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 8.0, 4.0, 7.0, 9.0, 5.0, 17.0, 23.0, 33.0, 56.0, 71.0, 150.0, 288.0, 470.0, 1091.0, 2329.0, 5956.0, 16992.0, 63527.0, 385158.0, 463321.0, 77673.0, 19683.0, 6649.0, 2624.0, 1102.0, 577.0, 294.0, 161.0, 85.0, 62.0, 33.0, 23.0, 17.0, 16.0, 16.0, 6.0, 8.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -7.014404296875, -6.80224609375, -6.590087890625, -6.3779296875, -6.165771484375, -5.95361328125, -5.741455078125, -5.529296875, -5.317138671875, -5.10498046875, -4.892822265625, -4.6806640625, -4.468505859375, -4.25634765625, -4.044189453125, -3.83203125, -3.619873046875, -3.40771484375, -3.195556640625, -2.9833984375, -2.771240234375, -2.55908203125, -2.346923828125, -2.134765625, -1.922607421875, -1.71044921875, -1.498291015625, -1.2861328125, -1.073974609375, -0.86181640625, -0.649658203125, -0.4375, -0.225341796875, -0.01318359375, 0.198974609375, 0.4111328125, 0.623291015625, 0.83544921875, 1.047607421875, 1.259765625, 1.471923828125, 1.68408203125, 1.896240234375, 2.1083984375, 2.320556640625, 2.53271484375, 2.744873046875, 2.95703125, 3.169189453125, 3.38134765625, 3.593505859375, 3.8056640625, 4.017822265625, 4.22998046875, 4.442138671875, 4.654296875, 4.866455078125, 5.07861328125, 5.290771484375, 5.5029296875, 5.715087890625, 5.92724609375, 6.139404296875, 6.3515625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 7.0, 5.0, 5.0, 7.0, 3.0, 13.0, 9.0, 8.0, 16.0, 16.0, 18.0, 23.0, 30.0, 32.0, 47.0, 36.0, 43.0, 46.0, 37.0, 56.0, 50.0, 51.0, 48.0, 48.0, 51.0, 45.0, 40.0, 28.0, 28.0, 29.0, 17.0, 26.0, 18.0, 14.0, 12.0, 12.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.2410888671875, -2.167724609375, -2.0943603515625, -2.02099609375, -1.9476318359375, -1.874267578125, -1.8009033203125, -1.7275390625, -1.6541748046875, -1.580810546875, -1.5074462890625, -1.43408203125, -1.3607177734375, -1.287353515625, -1.2139892578125, -1.140625, -1.0672607421875, -0.993896484375, -0.9205322265625, -0.84716796875, -0.7738037109375, -0.700439453125, -0.6270751953125, -0.5537109375, -0.4803466796875, -0.406982421875, -0.3336181640625, -0.26025390625, -0.1868896484375, -0.113525390625, -0.0401611328125, 0.033203125, 0.1065673828125, 0.179931640625, 0.2532958984375, 0.32666015625, 0.4000244140625, 0.473388671875, 0.5467529296875, 0.6201171875, 0.6934814453125, 0.766845703125, 0.8402099609375, 0.91357421875, 0.9869384765625, 1.060302734375, 1.1336669921875, 1.20703125, 1.2803955078125, 1.353759765625, 1.4271240234375, 1.50048828125, 1.5738525390625, 1.647216796875, 1.7205810546875, 1.7939453125, 1.8673095703125, 1.940673828125, 2.0140380859375, 2.08740234375, 2.1607666015625, 2.234130859375, 2.3074951171875, 2.380859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 10.0, 6.0, 10.0, 22.0, 39.0, 54.0, 74.0, 101.0, 178.0, 282.0, 588.0, 1252.0, 3350.0, 13657.0, 143465.0, 831195.0, 43265.0, 6923.0, 2167.0, 887.0, 398.0, 209.0, 136.0, 87.0, 57.0, 40.0, 27.0, 15.0, 17.0, 10.0, 8.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8984375, -13.4542236328125, -13.010009765625, -12.5657958984375, -12.12158203125, -11.6773681640625, -11.233154296875, -10.7889404296875, -10.3447265625, -9.9005126953125, -9.456298828125, -9.0120849609375, -8.56787109375, -8.1236572265625, -7.679443359375, -7.2352294921875, -6.791015625, -6.3468017578125, -5.902587890625, -5.4583740234375, -5.01416015625, -4.5699462890625, -4.125732421875, -3.6815185546875, -3.2373046875, -2.7930908203125, -2.348876953125, -1.9046630859375, -1.46044921875, -1.0162353515625, -0.572021484375, -0.1278076171875, 0.31640625, 0.7606201171875, 1.204833984375, 1.6490478515625, 2.09326171875, 2.5374755859375, 2.981689453125, 3.4259033203125, 3.8701171875, 4.3143310546875, 4.758544921875, 5.2027587890625, 5.64697265625, 6.0911865234375, 6.535400390625, 6.9796142578125, 7.423828125, 7.8680419921875, 8.312255859375, 8.7564697265625, 9.20068359375, 9.6448974609375, 10.089111328125, 10.5333251953125, 10.9775390625, 11.4217529296875, 11.865966796875, 12.3101806640625, 12.75439453125, 13.1986083984375, 13.642822265625, 14.0870361328125, 14.53125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 9.0, 12.0, 19.0, 21.0, 22.0, 24.0, 31.0, 40.0, 40.0, 46.0, 55.0, 50.0, 53.0, 39.0, 59.0, 45.0, 59.0, 41.0, 54.0, 38.0, 30.0, 37.0, 36.0, 18.0, 19.0, 18.0, 13.0, 6.0, 7.0, 8.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.1875, -10.828369140625, -10.46923828125, -10.110107421875, -9.7509765625, -9.391845703125, -9.03271484375, -8.673583984375, -8.314453125, -7.955322265625, -7.59619140625, -7.237060546875, -6.8779296875, -6.518798828125, -6.15966796875, -5.800537109375, -5.44140625, -5.082275390625, -4.72314453125, -4.364013671875, -4.0048828125, -3.645751953125, -3.28662109375, -2.927490234375, -2.568359375, -2.209228515625, -1.85009765625, -1.490966796875, -1.1318359375, -0.772705078125, -0.41357421875, -0.054443359375, 0.3046875, 0.663818359375, 1.02294921875, 1.382080078125, 1.7412109375, 2.100341796875, 2.45947265625, 2.818603515625, 3.177734375, 3.536865234375, 3.89599609375, 4.255126953125, 4.6142578125, 4.973388671875, 5.33251953125, 5.691650390625, 6.05078125, 6.409912109375, 6.76904296875, 7.128173828125, 7.4873046875, 7.846435546875, 8.20556640625, 8.564697265625, 8.923828125, 9.282958984375, 9.64208984375, 10.001220703125, 10.3603515625, 10.719482421875, 11.07861328125, 11.437744140625, 11.796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 5.0, 4.0, 7.0, 7.0, 14.0, 18.0, 23.0, 23.0, 31.0, 50.0, 72.0, 100.0, 176.0, 337.0, 711.0, 1801.0, 5121.0, 20402.0, 124867.0, 778558.0, 92438.0, 16433.0, 4403.0, 1532.0, 619.0, 303.0, 189.0, 86.0, 59.0, 40.0, 37.0, 14.0, 15.0, 18.0, 9.0, 13.0, 9.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.2625732421875, -4.107177734375, -3.9517822265625, -3.79638671875, -3.6409912109375, -3.485595703125, -3.3302001953125, -3.1748046875, -3.0194091796875, -2.864013671875, -2.7086181640625, -2.55322265625, -2.3978271484375, -2.242431640625, -2.0870361328125, -1.931640625, -1.7762451171875, -1.620849609375, -1.4654541015625, -1.31005859375, -1.1546630859375, -0.999267578125, -0.8438720703125, -0.6884765625, -0.5330810546875, -0.377685546875, -0.2222900390625, -0.06689453125, 0.0885009765625, 0.243896484375, 0.3992919921875, 0.5546875, 0.7100830078125, 0.865478515625, 1.0208740234375, 1.17626953125, 1.3316650390625, 1.487060546875, 1.6424560546875, 1.7978515625, 1.9532470703125, 2.108642578125, 2.2640380859375, 2.41943359375, 2.5748291015625, 2.730224609375, 2.8856201171875, 3.041015625, 3.1964111328125, 3.351806640625, 3.5072021484375, 3.66259765625, 3.8179931640625, 3.973388671875, 4.1287841796875, 4.2841796875, 4.4395751953125, 4.594970703125, 4.7503662109375, 4.90576171875, 5.0611572265625, 5.216552734375, 5.3719482421875, 5.52734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 5.0, 8.0, 8.0, 13.0, 13.0, 22.0, 30.0, 31.0, 47.0, 58.0, 93.0, 110.0, 102.0, 99.0, 83.0, 50.0, 29.0, 32.0, 21.0, 14.0, 15.0, 15.0, 12.0, 10.0, 5.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0008516311645507812, -0.000825829803943634, -0.0008000284433364868, -0.0007742270827293396, -0.0007484257221221924, -0.0007226243615150452, -0.000696823000907898, -0.0006710216403007507, -0.0006452202796936035, -0.0006194189190864563, -0.0005936175584793091, -0.0005678161978721619, -0.0005420148372650146, -0.0005162134766578674, -0.0004904121160507202, -0.000464610755443573, -0.0004388093948364258, -0.00041300803422927856, -0.00038720667362213135, -0.00036140531301498413, -0.0003356039524078369, -0.0003098025918006897, -0.0002840012311935425, -0.00025819987058639526, -0.00023239850997924805, -0.00020659714937210083, -0.0001807957887649536, -0.0001549944281578064, -0.00012919306755065918, -0.00010339170694351196, -7.759034633636475e-05, -5.178898572921753e-05, -2.5987625122070312e-05, -1.862645149230957e-07, 2.561509609222412e-05, 5.141645669937134e-05, 7.721781730651855e-05, 0.00010301917791366577, 0.000128820538520813, 0.0001546218991279602, 0.00018042325973510742, 0.00020622462034225464, 0.00023202598094940186, 0.00025782734155654907, 0.0002836287021636963, 0.0003094300627708435, 0.0003352314233779907, 0.00036103278398513794, 0.00038683414459228516, 0.0004126355051994324, 0.0004384368658065796, 0.0004642382264137268, 0.000490039587020874, 0.0005158409476280212, 0.0005416423082351685, 0.0005674436688423157, 0.0005932450294494629, 0.0006190463900566101, 0.0006448477506637573, 0.0006706491112709045, 0.0006964504718780518, 0.000722251832485199, 0.0007480531930923462, 0.0007738545536994934, 0.0007996559143066406]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 13.0, 17.0, 27.0, 41.0, 53.0, 92.0, 133.0, 205.0, 311.0, 587.0, 992.0, 2244.0, 5866.0, 19457.0, 96064.0, 722226.0, 158809.0, 27807.0, 7898.0, 2873.0, 1235.0, 612.0, 327.0, 214.0, 131.0, 98.0, 55.0, 34.0, 32.0, 20.0, 20.0, 8.0, 15.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.806640625, -3.682342529296875, -3.55804443359375, -3.433746337890625, -3.3094482421875, -3.185150146484375, -3.06085205078125, -2.936553955078125, -2.812255859375, -2.687957763671875, -2.56365966796875, -2.439361572265625, -2.3150634765625, -2.190765380859375, -2.06646728515625, -1.942169189453125, -1.81787109375, -1.693572998046875, -1.56927490234375, -1.444976806640625, -1.3206787109375, -1.196380615234375, -1.07208251953125, -0.947784423828125, -0.823486328125, -0.699188232421875, -0.57489013671875, -0.450592041015625, -0.3262939453125, -0.201995849609375, -0.07769775390625, 0.046600341796875, 0.1708984375, 0.295196533203125, 0.41949462890625, 0.543792724609375, 0.6680908203125, 0.792388916015625, 0.91668701171875, 1.040985107421875, 1.165283203125, 1.289581298828125, 1.41387939453125, 1.538177490234375, 1.6624755859375, 1.786773681640625, 1.91107177734375, 2.035369873046875, 2.15966796875, 2.283966064453125, 2.40826416015625, 2.532562255859375, 2.6568603515625, 2.781158447265625, 2.90545654296875, 3.029754638671875, 3.154052734375, 3.278350830078125, 3.40264892578125, 3.526947021484375, 3.6512451171875, 3.775543212890625, 3.89984130859375, 4.024139404296875, 4.1484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 10.0, 5.0, 12.0, 11.0, 9.0, 18.0, 33.0, 57.0, 79.0, 100.0, 156.0, 125.0, 84.0, 77.0, 65.0, 34.0, 21.0, 19.0, 15.0, 18.0, 11.0, 10.0, 4.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.24609375, -5.111541748046875, -4.97698974609375, -4.842437744140625, -4.7078857421875, -4.573333740234375, -4.43878173828125, -4.304229736328125, -4.169677734375, -4.035125732421875, -3.90057373046875, -3.766021728515625, -3.6314697265625, -3.496917724609375, -3.36236572265625, -3.227813720703125, -3.09326171875, -2.958709716796875, -2.82415771484375, -2.689605712890625, -2.5550537109375, -2.420501708984375, -2.28594970703125, -2.151397705078125, -2.016845703125, -1.882293701171875, -1.74774169921875, -1.613189697265625, -1.4786376953125, -1.344085693359375, -1.20953369140625, -1.074981689453125, -0.9404296875, -0.805877685546875, -0.67132568359375, -0.536773681640625, -0.4022216796875, -0.267669677734375, -0.13311767578125, 0.001434326171875, 0.135986328125, 0.270538330078125, 0.40509033203125, 0.539642333984375, 0.6741943359375, 0.808746337890625, 0.94329833984375, 1.077850341796875, 1.21240234375, 1.346954345703125, 1.48150634765625, 1.616058349609375, 1.7506103515625, 1.885162353515625, 2.01971435546875, 2.154266357421875, 2.288818359375, 2.423370361328125, 2.55792236328125, 2.692474365234375, 2.8270263671875, 2.961578369140625, 3.09613037109375, 3.230682373046875, 3.365234375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 11.0, 22.0, 34.0, 57.0, 121.0, 272.0, 247.0, 109.0, 52.0, 22.0, 13.0, 9.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.71632385253906, -85.12987518310547, -82.54341888427734, -79.95697021484375, -77.37051391601562, -74.78406524658203, -72.1976089477539, -69.61116027832031, -67.02470397949219, -64.4382553100586, -61.85179901123047, -59.26534652709961, -56.67889404296875, -54.092445373535156, -51.5059928894043, -48.91954040527344, -46.333091735839844, -43.746639251708984, -41.160186767578125, -38.573734283447266, -35.987281799316406, -33.40083312988281, -30.814380645751953, -28.227928161621094, -25.641475677490234, -23.055023193359375, -20.468570709228516, -17.88212013244629, -15.29566764831543, -12.70921516418457, -10.122763633728027, -7.536312103271484, -4.949867248535156, -2.363415241241455, 0.2230367660522461, 2.8094887733459473, 5.395940780639648, 7.982393264770508, 10.56884479522705, 13.155296325683594, 15.741748809814453, 18.328201293945312, 20.914653778076172, 23.5011043548584, 26.087556838989258, 28.674009323120117, 31.260459899902344, 33.8469123840332, 36.43336486816406, 39.01981735229492, 41.60626983642578, 44.19272232055664, 46.7791748046875, 49.365623474121094, 51.95207595825195, 54.53852844238281, 57.12498092651367, 59.71143341064453, 62.29788589477539, 64.88433837890625, 67.47078704833984, 70.05724334716797, 72.64369201660156, 75.23014831542969, 77.81659698486328]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 1.0, 11.0, 10.0, 19.0, 10.0, 22.0, 9.0, 23.0, 26.0, 29.0, 32.0, 23.0, 29.0, 37.0, 64.0, 60.0, 87.0, 71.0, 61.0, 55.0, 36.0, 40.0, 41.0, 25.0, 32.0, 22.0, 20.0, 14.0, 19.0, 20.0, 7.0, 6.0, 4.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.73350524902344, -45.311912536621094, -43.89031982421875, -42.468727111816406, -41.04713821411133, -39.625545501708984, -38.20395278930664, -36.7823600769043, -35.36076736450195, -33.93917465209961, -32.517581939697266, -31.095991134643555, -29.67439842224121, -28.2528076171875, -26.831214904785156, -25.409622192382812, -23.9880313873291, -22.566438674926758, -21.144847869873047, -19.723255157470703, -18.30166244506836, -16.880069732666016, -15.458478927612305, -14.036886215209961, -12.615294456481934, -11.193702697753906, -9.772109985351562, -8.350518226623535, -6.92892599105835, -5.507333755493164, -4.085741996765137, -2.664149284362793, -1.2425575256347656, 0.17903459072113037, 1.6006267070770264, 3.022218704223633, 4.443810939788818, 5.865403175354004, 7.286994934082031, 8.708587646484375, 10.130179405212402, 11.55177116394043, 12.973363876342773, 14.3949556350708, 15.816547393798828, 17.238140106201172, 18.659732818603516, 20.08132553100586, 21.50291633605957, 22.924509048461914, 24.346099853515625, 25.76769256591797, 27.189285278320312, 28.610877990722656, 30.032468795776367, 31.45406150817871, 32.87565231323242, 34.297245025634766, 35.71883773803711, 37.14042663574219, 38.56201934814453, 39.983612060546875, 41.40520477294922, 42.82679748535156, 44.248390197753906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 6.0, 10.0, 15.0, 12.0, 22.0, 24.0, 32.0, 57.0, 66.0, 116.0, 254.0, 361.0, 928.0, 3185.0, 17494.0, 283281.0, 3616333.0, 245522.0, 19905.0, 4207.0, 1299.0, 519.0, 287.0, 146.0, 81.0, 41.0, 31.0, 19.0, 10.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.811767578125, -8.57666015625, -8.341552734375, -8.1064453125, -7.871337890625, -7.63623046875, -7.401123046875, -7.166015625, -6.930908203125, -6.69580078125, -6.460693359375, -6.2255859375, -5.990478515625, -5.75537109375, -5.520263671875, -5.28515625, -5.050048828125, -4.81494140625, -4.579833984375, -4.3447265625, -4.109619140625, -3.87451171875, -3.639404296875, -3.404296875, -3.169189453125, -2.93408203125, -2.698974609375, -2.4638671875, -2.228759765625, -1.99365234375, -1.758544921875, -1.5234375, -1.288330078125, -1.05322265625, -0.818115234375, -0.5830078125, -0.347900390625, -0.11279296875, 0.122314453125, 0.357421875, 0.592529296875, 0.82763671875, 1.062744140625, 1.2978515625, 1.532958984375, 1.76806640625, 2.003173828125, 2.23828125, 2.473388671875, 2.70849609375, 2.943603515625, 3.1787109375, 3.413818359375, 3.64892578125, 3.884033203125, 4.119140625, 4.354248046875, 4.58935546875, 4.824462890625, 5.0595703125, 5.294677734375, 5.52978515625, 5.764892578125, 6.0]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 2.0, 5.0, 6.0, 5.0, 16.0, 18.0, 18.0, 21.0, 36.0, 34.0, 55.0, 44.0, 66.0, 71.0, 86.0, 51.0, 65.0, 70.0, 61.0, 69.0, 49.0, 30.0, 31.0, 24.0, 11.0, 14.0, 13.0, 10.0, 12.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.58203125, -4.478057861328125, -4.37408447265625, -4.270111083984375, -4.1661376953125, -4.062164306640625, -3.95819091796875, -3.854217529296875, -3.750244140625, -3.646270751953125, -3.54229736328125, -3.438323974609375, -3.3343505859375, -3.230377197265625, -3.12640380859375, -3.022430419921875, -2.91845703125, -2.814483642578125, -2.71051025390625, -2.606536865234375, -2.5025634765625, -2.398590087890625, -2.29461669921875, -2.190643310546875, -2.086669921875, -1.982696533203125, -1.87872314453125, -1.774749755859375, -1.6707763671875, -1.566802978515625, -1.46282958984375, -1.358856201171875, -1.2548828125, -1.150909423828125, -1.04693603515625, -0.942962646484375, -0.8389892578125, -0.735015869140625, -0.63104248046875, -0.527069091796875, -0.423095703125, -0.319122314453125, -0.21514892578125, -0.111175537109375, -0.0072021484375, 0.096771240234375, 0.20074462890625, 0.304718017578125, 0.40869140625, 0.512664794921875, 0.61663818359375, 0.720611572265625, 0.8245849609375, 0.928558349609375, 1.03253173828125, 1.136505126953125, 1.240478515625, 1.344451904296875, 1.44842529296875, 1.552398681640625, 1.6563720703125, 1.760345458984375, 1.86431884765625, 1.968292236328125, 2.072265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 6.0, 11.0, 14.0, 43.0, 44.0, 106.0, 207.0, 348.0, 730.0, 1604.0, 4415.0, 25627.0, 2093740.0, 2036024.0, 24489.0, 4097.0, 1439.0, 649.0, 298.0, 181.0, 85.0, 39.0, 30.0, 14.0, 10.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.363037109375, -13.95263671875, -13.542236328125, -13.1318359375, -12.721435546875, -12.31103515625, -11.900634765625, -11.490234375, -11.079833984375, -10.66943359375, -10.259033203125, -9.8486328125, -9.438232421875, -9.02783203125, -8.617431640625, -8.20703125, -7.796630859375, -7.38623046875, -6.975830078125, -6.5654296875, -6.155029296875, -5.74462890625, -5.334228515625, -4.923828125, -4.513427734375, -4.10302734375, -3.692626953125, -3.2822265625, -2.871826171875, -2.46142578125, -2.051025390625, -1.640625, -1.230224609375, -0.81982421875, -0.409423828125, 0.0009765625, 0.411376953125, 0.82177734375, 1.232177734375, 1.642578125, 2.052978515625, 2.46337890625, 2.873779296875, 3.2841796875, 3.694580078125, 4.10498046875, 4.515380859375, 4.92578125, 5.336181640625, 5.74658203125, 6.156982421875, 6.5673828125, 6.977783203125, 7.38818359375, 7.798583984375, 8.208984375, 8.619384765625, 9.02978515625, 9.440185546875, 9.8505859375, 10.260986328125, 10.67138671875, 11.081787109375, 11.4921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 24.0, 23.0, 50.0, 105.0, 248.0, 739.0, 1361.0, 901.0, 347.0, 136.0, 64.0, 24.0, 17.0, 9.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.421875, -15.0008544921875, -14.579833984375, -14.1588134765625, -13.73779296875, -13.3167724609375, -12.895751953125, -12.4747314453125, -12.0537109375, -11.6326904296875, -11.211669921875, -10.7906494140625, -10.36962890625, -9.9486083984375, -9.527587890625, -9.1065673828125, -8.685546875, -8.2645263671875, -7.843505859375, -7.4224853515625, -7.00146484375, -6.5804443359375, -6.159423828125, -5.7384033203125, -5.3173828125, -4.8963623046875, -4.475341796875, -4.0543212890625, -3.63330078125, -3.2122802734375, -2.791259765625, -2.3702392578125, -1.94921875, -1.5281982421875, -1.107177734375, -0.6861572265625, -0.26513671875, 0.1558837890625, 0.576904296875, 0.9979248046875, 1.4189453125, 1.8399658203125, 2.260986328125, 2.6820068359375, 3.10302734375, 3.5240478515625, 3.945068359375, 4.3660888671875, 4.787109375, 5.2081298828125, 5.629150390625, 6.0501708984375, 6.47119140625, 6.8922119140625, 7.313232421875, 7.7342529296875, 8.1552734375, 8.5762939453125, 8.997314453125, 9.4183349609375, 9.83935546875, 10.2603759765625, 10.681396484375, 11.1024169921875, 11.5234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 10.0, 27.0, 75.0, 177.0, 285.0, 271.0, 78.0, 26.0, 11.0, 9.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-151.2151336669922, -147.9761505126953, -144.73715209960938, -141.4981689453125, -138.25917053222656, -135.0201873779297, -131.78118896484375, -128.54220581054688, -125.30320739746094, -122.06421661376953, -118.82522583007812, -115.58623504638672, -112.34724426269531, -109.1082534790039, -105.8692626953125, -102.63027954101562, -99.39128875732422, -96.15229797363281, -92.9133071899414, -89.67431640625, -86.4353256225586, -83.19633483886719, -79.95735168457031, -76.71835327148438, -73.4793701171875, -70.2403793334961, -67.00138854980469, -63.76239776611328, -60.523406982421875, -57.28441619873047, -54.04542922973633, -50.80643844604492, -47.56745147705078, -44.328460693359375, -41.08946990966797, -37.85047912597656, -34.611488342285156, -31.372499465942383, -28.13351058959961, -24.894519805908203, -21.655529022216797, -18.41653823852539, -15.1775484085083, -11.938558578491211, -8.699567794799805, -5.460577011108398, -2.221588134765625, 1.0174026489257812, 4.2563934326171875, 7.4953837394714355, 10.734374046325684, 13.973363876342773, 17.21235466003418, 20.451345443725586, 23.69033432006836, 26.929325103759766, 30.168315887451172, 33.40730667114258, 36.646297454833984, 39.885284423828125, 43.12427520751953, 46.36326599121094, 49.602256774902344, 52.84124755859375, 56.080238342285156]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 9.0, 9.0, 12.0, 18.0, 41.0, 54.0, 55.0, 83.0, 104.0, 121.0, 111.0, 96.0, 84.0, 63.0, 43.0, 42.0, 27.0, 14.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.93925476074219, -54.924468994140625, -52.9096794128418, -50.894893646240234, -48.880104064941406, -46.865318298339844, -44.85053253173828, -42.83574676513672, -40.82095718383789, -38.80617141723633, -36.7913818359375, -34.77659606933594, -32.761810302734375, -30.747020721435547, -28.732234954833984, -26.71744728088379, -24.702659606933594, -22.6878719329834, -20.673084259033203, -18.65829849243164, -16.643510818481445, -14.62872314453125, -12.613936424255371, -10.599149703979492, -8.584362030029297, -6.56957483291626, -4.554787635803223, -2.5400004386901855, -0.5252132415771484, 1.4895744323730469, 3.504361152648926, 5.519147872924805, 7.533927917480469, 9.548715591430664, 11.563502311706543, 13.578289031982422, 15.593076705932617, 17.607864379882812, 19.622650146484375, 21.63743782043457, 23.652225494384766, 25.66701316833496, 27.681800842285156, 29.69658660888672, 31.711374282836914, 33.72616195678711, 35.74094772338867, 37.7557373046875, 39.77052307128906, 41.785308837890625, 43.80009841918945, 45.814884185791016, 47.829673767089844, 49.844459533691406, 51.85924530029297, 53.87403106689453, 55.88882064819336, 57.90360641479492, 59.91839599609375, 61.93318176269531, 63.947967529296875, 65.96275329589844, 67.97754669189453, 69.9923324584961, 72.00711822509766]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 16.0, 11.0, 16.0, 20.0, 20.0, 31.0, 47.0, 99.0, 185.0, 344.0, 784.0, 2107.0, 5839.0, 23865.0, 229951.0, 666696.0, 98054.0, 13544.0, 4088.0, 1563.0, 609.0, 271.0, 140.0, 87.0, 50.0, 29.0, 13.0, 19.0, 9.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.8359375, -7.607666015625, -7.37939453125, -7.151123046875, -6.9228515625, -6.694580078125, -6.46630859375, -6.238037109375, -6.009765625, -5.781494140625, -5.55322265625, -5.324951171875, -5.0966796875, -4.868408203125, -4.64013671875, -4.411865234375, -4.18359375, -3.955322265625, -3.72705078125, -3.498779296875, -3.2705078125, -3.042236328125, -2.81396484375, -2.585693359375, -2.357421875, -2.129150390625, -1.90087890625, -1.672607421875, -1.4443359375, -1.216064453125, -0.98779296875, -0.759521484375, -0.53125, -0.302978515625, -0.07470703125, 0.153564453125, 0.3818359375, 0.610107421875, 0.83837890625, 1.066650390625, 1.294921875, 1.523193359375, 1.75146484375, 1.979736328125, 2.2080078125, 2.436279296875, 2.66455078125, 2.892822265625, 3.12109375, 3.349365234375, 3.57763671875, 3.805908203125, 4.0341796875, 4.262451171875, 4.49072265625, 4.718994140625, 4.947265625, 5.175537109375, 5.40380859375, 5.632080078125, 5.8603515625, 6.088623046875, 6.31689453125, 6.545166015625, 6.7734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 10.0, 13.0, 34.0, 34.0, 44.0, 56.0, 56.0, 71.0, 71.0, 86.0, 82.0, 89.0, 70.0, 61.0, 50.0, 41.0, 32.0, 27.0, 22.0, 14.0, 9.0, 6.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.2010498046875, -4.070068359375, -3.9390869140625, -3.80810546875, -3.6771240234375, -3.546142578125, -3.4151611328125, -3.2841796875, -3.1531982421875, -3.022216796875, -2.8912353515625, -2.76025390625, -2.6292724609375, -2.498291015625, -2.3673095703125, -2.236328125, -2.1053466796875, -1.974365234375, -1.8433837890625, -1.71240234375, -1.5814208984375, -1.450439453125, -1.3194580078125, -1.1884765625, -1.0574951171875, -0.926513671875, -0.7955322265625, -0.66455078125, -0.5335693359375, -0.402587890625, -0.2716064453125, -0.140625, -0.0096435546875, 0.121337890625, 0.2523193359375, 0.38330078125, 0.5142822265625, 0.645263671875, 0.7762451171875, 0.9072265625, 1.0382080078125, 1.169189453125, 1.3001708984375, 1.43115234375, 1.5621337890625, 1.693115234375, 1.8240966796875, 1.955078125, 2.0860595703125, 2.217041015625, 2.3480224609375, 2.47900390625, 2.6099853515625, 2.740966796875, 2.8719482421875, 3.0029296875, 3.1339111328125, 3.264892578125, 3.3958740234375, 3.52685546875, 3.6578369140625, 3.788818359375, 3.9197998046875, 4.05078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 5.0, 7.0, 10.0, 10.0, 10.0, 24.0, 22.0, 37.0, 77.0, 86.0, 175.0, 274.0, 602.0, 1242.0, 3000.0, 8936.0, 49124.0, 623182.0, 317541.0, 32708.0, 6809.0, 2391.0, 1046.0, 503.0, 270.0, 147.0, 97.0, 66.0, 51.0, 29.0, 20.0, 18.0, 10.0, 8.0, 2.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -8.15777587890625, -7.9171142578125, -7.67645263671875, -7.435791015625, -7.19512939453125, -6.9544677734375, -6.71380615234375, -6.47314453125, -6.23248291015625, -5.9918212890625, -5.75115966796875, -5.510498046875, -5.26983642578125, -5.0291748046875, -4.78851318359375, -4.5478515625, -4.30718994140625, -4.0665283203125, -3.82586669921875, -3.585205078125, -3.34454345703125, -3.1038818359375, -2.86322021484375, -2.62255859375, -2.38189697265625, -2.1412353515625, -1.90057373046875, -1.659912109375, -1.41925048828125, -1.1785888671875, -0.93792724609375, -0.697265625, -0.45660400390625, -0.2159423828125, 0.02471923828125, 0.265380859375, 0.50604248046875, 0.7467041015625, 0.98736572265625, 1.22802734375, 1.46868896484375, 1.7093505859375, 1.95001220703125, 2.190673828125, 2.43133544921875, 2.6719970703125, 2.91265869140625, 3.1533203125, 3.39398193359375, 3.6346435546875, 3.87530517578125, 4.115966796875, 4.35662841796875, 4.5972900390625, 4.83795166015625, 5.07861328125, 5.31927490234375, 5.5599365234375, 5.80059814453125, 6.041259765625, 6.28192138671875, 6.5225830078125, 6.76324462890625, 7.00390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 13.0, 23.0, 25.0, 38.0, 36.0, 36.0, 64.0, 46.0, 60.0, 53.0, 62.0, 58.0, 64.0, 54.0, 44.0, 54.0, 44.0, 39.0, 28.0, 24.0, 17.0, 23.0, 12.0, 14.0, 13.0, 11.0, 3.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.1317138671875, -10.755615234375, -10.3795166015625, -10.00341796875, -9.6273193359375, -9.251220703125, -8.8751220703125, -8.4990234375, -8.1229248046875, -7.746826171875, -7.3707275390625, -6.99462890625, -6.6185302734375, -6.242431640625, -5.8663330078125, -5.490234375, -5.1141357421875, -4.738037109375, -4.3619384765625, -3.98583984375, -3.6097412109375, -3.233642578125, -2.8575439453125, -2.4814453125, -2.1053466796875, -1.729248046875, -1.3531494140625, -0.97705078125, -0.6009521484375, -0.224853515625, 0.1512451171875, 0.52734375, 0.9034423828125, 1.279541015625, 1.6556396484375, 2.03173828125, 2.4078369140625, 2.783935546875, 3.1600341796875, 3.5361328125, 3.9122314453125, 4.288330078125, 4.6644287109375, 5.04052734375, 5.4166259765625, 5.792724609375, 6.1688232421875, 6.544921875, 6.9210205078125, 7.297119140625, 7.6732177734375, 8.04931640625, 8.4254150390625, 8.801513671875, 9.1776123046875, 9.5537109375, 9.9298095703125, 10.305908203125, 10.6820068359375, 11.05810546875, 11.4342041015625, 11.810302734375, 12.1864013671875, 12.5625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 6.0, 5.0, 13.0, 12.0, 34.0, 39.0, 65.0, 109.0, 188.0, 325.0, 605.0, 1070.0, 2275.0, 5441.0, 19467.0, 140700.0, 763880.0, 91083.0, 14487.0, 4591.0, 1937.0, 958.0, 538.0, 293.0, 161.0, 111.0, 45.0, 36.0, 30.0, 10.0, 6.0, 7.0, 11.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.8203125, -3.702423095703125, -3.58453369140625, -3.466644287109375, -3.3487548828125, -3.230865478515625, -3.11297607421875, -2.995086669921875, -2.877197265625, -2.759307861328125, -2.64141845703125, -2.523529052734375, -2.4056396484375, -2.287750244140625, -2.16986083984375, -2.051971435546875, -1.93408203125, -1.816192626953125, -1.69830322265625, -1.580413818359375, -1.4625244140625, -1.344635009765625, -1.22674560546875, -1.108856201171875, -0.990966796875, -0.873077392578125, -0.75518798828125, -0.637298583984375, -0.5194091796875, -0.401519775390625, -0.28363037109375, -0.165740966796875, -0.0478515625, 0.070037841796875, 0.18792724609375, 0.305816650390625, 0.4237060546875, 0.541595458984375, 0.65948486328125, 0.777374267578125, 0.895263671875, 1.013153076171875, 1.13104248046875, 1.248931884765625, 1.3668212890625, 1.484710693359375, 1.60260009765625, 1.720489501953125, 1.83837890625, 1.956268310546875, 2.07415771484375, 2.192047119140625, 2.3099365234375, 2.427825927734375, 2.54571533203125, 2.663604736328125, 2.781494140625, 2.899383544921875, 3.01727294921875, 3.135162353515625, 3.2530517578125, 3.370941162109375, 3.48883056640625, 3.606719970703125, 3.724609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 9.0, 15.0, 50.0, 124.0, 197.0, 304.0, 161.0, 72.0, 33.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0019254684448242188, -0.0018675774335861206, -0.0018096864223480225, -0.0017517954111099243, -0.0016939043998718262, -0.001636013388633728, -0.0015781223773956299, -0.0015202313661575317, -0.0014623403549194336, -0.0014044493436813354, -0.0013465583324432373, -0.0012886673212051392, -0.001230776309967041, -0.0011728852987289429, -0.0011149942874908447, -0.0010571032762527466, -0.0009992122650146484, -0.0009413212537765503, -0.0008834302425384521, -0.000825539231300354, -0.0007676482200622559, -0.0007097572088241577, -0.0006518661975860596, -0.0005939751863479614, -0.0005360841751098633, -0.00047819316387176514, -0.000420302152633667, -0.00036241114139556885, -0.0003045201301574707, -0.00024662911891937256, -0.00018873810768127441, -0.00013084709644317627, -7.295608520507812e-05, -1.506507396697998e-05, 4.2825937271118164e-05, 0.00010071694850921631, 0.00015860795974731445, 0.0002164989709854126, 0.00027438998222351074, 0.0003322809934616089, 0.00039017200469970703, 0.0004480630159378052, 0.0005059540271759033, 0.0005638450384140015, 0.0006217360496520996, 0.0006796270608901978, 0.0007375180721282959, 0.000795409083366394, 0.0008533000946044922, 0.0009111911058425903, 0.0009690821170806885, 0.0010269731283187866, 0.0010848641395568848, 0.001142755150794983, 0.001200646162033081, 0.0012585371732711792, 0.0013164281845092773, 0.0013743191957473755, 0.0014322102069854736, 0.0014901012182235718, 0.00154799222946167, 0.001605883240699768, 0.0016637742519378662, 0.0017216652631759644, 0.0017795562744140625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 15.0, 20.0, 47.0, 85.0, 148.0, 310.0, 778.0, 2353.0, 8716.0, 57710.0, 770865.0, 182403.0, 18940.0, 4063.0, 1227.0, 442.0, 225.0, 86.0, 36.0, 27.0, 19.0, 13.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.73046875, -5.582489013671875, -5.43450927734375, -5.286529541015625, -5.1385498046875, -4.990570068359375, -4.84259033203125, -4.694610595703125, -4.546630859375, -4.398651123046875, -4.25067138671875, -4.102691650390625, -3.9547119140625, -3.806732177734375, -3.65875244140625, -3.510772705078125, -3.36279296875, -3.214813232421875, -3.06683349609375, -2.918853759765625, -2.7708740234375, -2.622894287109375, -2.47491455078125, -2.326934814453125, -2.178955078125, -2.030975341796875, -1.88299560546875, -1.735015869140625, -1.5870361328125, -1.439056396484375, -1.29107666015625, -1.143096923828125, -0.9951171875, -0.847137451171875, -0.69915771484375, -0.551177978515625, -0.4031982421875, -0.255218505859375, -0.10723876953125, 0.040740966796875, 0.188720703125, 0.336700439453125, 0.48468017578125, 0.632659912109375, 0.7806396484375, 0.928619384765625, 1.07659912109375, 1.224578857421875, 1.37255859375, 1.520538330078125, 1.66851806640625, 1.816497802734375, 1.9644775390625, 2.112457275390625, 2.26043701171875, 2.408416748046875, 2.556396484375, 2.704376220703125, 2.85235595703125, 3.000335693359375, 3.1483154296875, 3.296295166015625, 3.44427490234375, 3.592254638671875, 3.740234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 10.0, 10.0, 21.0, 29.0, 44.0, 75.0, 100.0, 128.0, 143.0, 107.0, 99.0, 64.0, 41.0, 29.0, 27.0, 17.0, 9.0, 5.0, 8.0, 6.0, 2.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.171875, -4.0577392578125, -3.943603515625, -3.8294677734375, -3.71533203125, -3.6011962890625, -3.487060546875, -3.3729248046875, -3.2587890625, -3.1446533203125, -3.030517578125, -2.9163818359375, -2.80224609375, -2.6881103515625, -2.573974609375, -2.4598388671875, -2.345703125, -2.2315673828125, -2.117431640625, -2.0032958984375, -1.88916015625, -1.7750244140625, -1.660888671875, -1.5467529296875, -1.4326171875, -1.3184814453125, -1.204345703125, -1.0902099609375, -0.97607421875, -0.8619384765625, -0.747802734375, -0.6336669921875, -0.51953125, -0.4053955078125, -0.291259765625, -0.1771240234375, -0.06298828125, 0.0511474609375, 0.165283203125, 0.2794189453125, 0.3935546875, 0.5076904296875, 0.621826171875, 0.7359619140625, 0.85009765625, 0.9642333984375, 1.078369140625, 1.1925048828125, 1.306640625, 1.4207763671875, 1.534912109375, 1.6490478515625, 1.76318359375, 1.8773193359375, 1.991455078125, 2.1055908203125, 2.2197265625, 2.3338623046875, 2.447998046875, 2.5621337890625, 2.67626953125, 2.7904052734375, 2.904541015625, 3.0186767578125, 3.1328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 12.0, 51.0, 116.0, 194.0, 323.0, 162.0, 73.0, 28.0, 17.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.83662414550781, -87.14225006103516, -84.4478759765625, -81.75349426269531, -79.05912017822266, -76.36474609375, -73.67037200927734, -70.97599792480469, -68.2816162109375, -65.58724212646484, -62.89286422729492, -60.198490142822266, -57.504112243652344, -54.80973815917969, -52.11536407470703, -49.420989990234375, -46.72661590576172, -44.03224182128906, -41.33786392211914, -38.643489837646484, -35.94911193847656, -33.254737854003906, -30.56036376953125, -27.86598777770996, -25.171611785888672, -22.477235794067383, -19.782859802246094, -17.088485717773438, -14.394109725952148, -11.69973373413086, -9.005359649658203, -6.310983657836914, -3.6166152954101562, -0.9222397804260254, 1.7721357345581055, 4.466510772705078, 7.160886764526367, 9.855262756347656, 12.549636840820312, 15.244012832641602, 17.93838882446289, 20.63276481628418, 23.32714080810547, 26.021514892578125, 28.715890884399414, 31.410266876220703, 34.10464096069336, 36.79901885986328, 39.49339294433594, 42.187767028808594, 44.882144927978516, 47.57651901245117, 50.270896911621094, 52.96527099609375, 55.659645080566406, 58.35401916503906, 61.048397064208984, 63.74277114868164, 66.43714904785156, 69.13152313232422, 71.82589721679688, 74.52027893066406, 77.21464538574219, 79.90902709960938, 82.60340118408203]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 5.0, 9.0, 13.0, 10.0, 15.0, 16.0, 30.0, 38.0, 48.0, 41.0, 68.0, 98.0, 83.0, 104.0, 80.0, 66.0, 56.0, 55.0, 35.0, 21.0, 26.0, 20.0, 14.0, 10.0, 17.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.59827423095703, -43.78861618041992, -41.97895812988281, -40.16929626464844, -38.35963821411133, -36.54998016357422, -34.740318298339844, -32.930660247802734, -31.121002197265625, -29.311344146728516, -27.501684188842773, -25.69202423095703, -23.882366180419922, -22.072708129882812, -20.26304817199707, -18.453388214111328, -16.64373016357422, -14.834071159362793, -13.024412155151367, -11.214753150939941, -9.405094146728516, -7.59543514251709, -5.785776138305664, -3.9761171340942383, -2.1664581298828125, -0.3567991256713867, 1.452859878540039, 3.262518882751465, 5.072177886962891, 6.881836891174316, 8.691495895385742, 10.501154899597168, 12.310813903808594, 14.12047290802002, 15.930131912231445, 17.739791870117188, 19.549449920654297, 21.359107971191406, 23.16876792907715, 24.97842788696289, 26.7880859375, 28.59774398803711, 30.40740394592285, 32.217063903808594, 34.0267219543457, 35.83638000488281, 37.64604187011719, 39.4556999206543, 41.265357971191406, 43.075016021728516, 44.884674072265625, 46.6943359375, 48.50399398803711, 50.31365203857422, 52.123313903808594, 53.9329719543457, 55.74263000488281, 57.55228805541992, 59.36194610595703, 61.171607971191406, 62.981266021728516, 64.79092407226562, 66.6005859375, 68.41024017333984, 70.21990203857422]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 20.0, 22.0, 19.0, 53.0, 98.0, 174.0, 367.0, 757.0, 2080.0, 8074.0, 64704.0, 2029549.0, 2013244.0, 64123.0, 8061.0, 1847.0, 604.0, 218.0, 101.0, 64.0, 37.0, 18.0, 6.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.4549560546875, -7.241943359375, -7.0289306640625, -6.81591796875, -6.6029052734375, -6.389892578125, -6.1768798828125, -5.9638671875, -5.7508544921875, -5.537841796875, -5.3248291015625, -5.11181640625, -4.8988037109375, -4.685791015625, -4.4727783203125, -4.259765625, -4.0467529296875, -3.833740234375, -3.6207275390625, -3.40771484375, -3.1947021484375, -2.981689453125, -2.7686767578125, -2.5556640625, -2.3426513671875, -2.129638671875, -1.9166259765625, -1.70361328125, -1.4906005859375, -1.277587890625, -1.0645751953125, -0.8515625, -0.6385498046875, -0.425537109375, -0.2125244140625, 0.00048828125, 0.2135009765625, 0.426513671875, 0.6395263671875, 0.8525390625, 1.0655517578125, 1.278564453125, 1.4915771484375, 1.70458984375, 1.9176025390625, 2.130615234375, 2.3436279296875, 2.556640625, 2.7696533203125, 2.982666015625, 3.1956787109375, 3.40869140625, 3.6217041015625, 3.834716796875, 4.0477294921875, 4.2607421875, 4.4737548828125, 4.686767578125, 4.8997802734375, 5.11279296875, 5.3258056640625, 5.538818359375, 5.7518310546875, 5.96484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 13.0, 12.0, 37.0, 47.0, 67.0, 67.0, 127.0, 105.0, 118.0, 123.0, 72.0, 63.0, 57.0, 34.0, 22.0, 9.0, 19.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.5123291015625, -3.329345703125, -3.1463623046875, -2.96337890625, -2.7803955078125, -2.597412109375, -2.4144287109375, -2.2314453125, -2.0484619140625, -1.865478515625, -1.6824951171875, -1.49951171875, -1.3165283203125, -1.133544921875, -0.9505615234375, -0.767578125, -0.5845947265625, -0.401611328125, -0.2186279296875, -0.03564453125, 0.1473388671875, 0.330322265625, 0.5133056640625, 0.6962890625, 0.8792724609375, 1.062255859375, 1.2452392578125, 1.42822265625, 1.6112060546875, 1.794189453125, 1.9771728515625, 2.16015625, 2.3431396484375, 2.526123046875, 2.7091064453125, 2.89208984375, 3.0750732421875, 3.258056640625, 3.4410400390625, 3.6240234375, 3.8070068359375, 3.989990234375, 4.1729736328125, 4.35595703125, 4.5389404296875, 4.721923828125, 4.9049072265625, 5.087890625, 5.2708740234375, 5.453857421875, 5.6368408203125, 5.81982421875, 6.0028076171875, 6.185791015625, 6.3687744140625, 6.5517578125, 6.7347412109375, 6.917724609375, 7.1007080078125, 7.28369140625, 7.4666748046875, 7.649658203125, 7.8326416015625, 8.015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 5.0, 5.0, 14.0, 12.0, 12.0, 29.0, 41.0, 63.0, 92.0, 216.0, 505.0, 2186.0, 25646.0, 3615097.0, 540150.0, 8323.0, 1168.0, 327.0, 148.0, 76.0, 61.0, 37.0, 33.0, 17.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.15625, -17.71142578125, -17.2666015625, -16.82177734375, -16.376953125, -15.93212890625, -15.4873046875, -15.04248046875, -14.59765625, -14.15283203125, -13.7080078125, -13.26318359375, -12.818359375, -12.37353515625, -11.9287109375, -11.48388671875, -11.0390625, -10.59423828125, -10.1494140625, -9.70458984375, -9.259765625, -8.81494140625, -8.3701171875, -7.92529296875, -7.48046875, -7.03564453125, -6.5908203125, -6.14599609375, -5.701171875, -5.25634765625, -4.8115234375, -4.36669921875, -3.921875, -3.47705078125, -3.0322265625, -2.58740234375, -2.142578125, -1.69775390625, -1.2529296875, -0.80810546875, -0.36328125, 0.08154296875, 0.5263671875, 0.97119140625, 1.416015625, 1.86083984375, 2.3056640625, 2.75048828125, 3.1953125, 3.64013671875, 4.0849609375, 4.52978515625, 4.974609375, 5.41943359375, 5.8642578125, 6.30908203125, 6.75390625, 7.19873046875, 7.6435546875, 8.08837890625, 8.533203125, 8.97802734375, 9.4228515625, 9.86767578125, 10.3125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 9.0, 5.0, 14.0, 18.0, 18.0, 35.0, 48.0, 87.0, 138.0, 197.0, 369.0, 610.0, 788.0, 657.0, 424.0, 254.0, 153.0, 85.0, 45.0, 30.0, 21.0, 19.0, 12.0, 11.0, 8.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.400146484375, -6.19091796875, -5.981689453125, -5.7724609375, -5.563232421875, -5.35400390625, -5.144775390625, -4.935546875, -4.726318359375, -4.51708984375, -4.307861328125, -4.0986328125, -3.889404296875, -3.68017578125, -3.470947265625, -3.26171875, -3.052490234375, -2.84326171875, -2.634033203125, -2.4248046875, -2.215576171875, -2.00634765625, -1.797119140625, -1.587890625, -1.378662109375, -1.16943359375, -0.960205078125, -0.7509765625, -0.541748046875, -0.33251953125, -0.123291015625, 0.0859375, 0.295166015625, 0.50439453125, 0.713623046875, 0.9228515625, 1.132080078125, 1.34130859375, 1.550537109375, 1.759765625, 1.968994140625, 2.17822265625, 2.387451171875, 2.5966796875, 2.805908203125, 3.01513671875, 3.224365234375, 3.43359375, 3.642822265625, 3.85205078125, 4.061279296875, 4.2705078125, 4.479736328125, 4.68896484375, 4.898193359375, 5.107421875, 5.316650390625, 5.52587890625, 5.735107421875, 5.9443359375, 6.153564453125, 6.36279296875, 6.572021484375, 6.78125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 13.0, 24.0, 43.0, 97.0, 164.0, 241.0, 190.0, 128.0, 56.0, 26.0, 12.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.83629608154297, -119.33831787109375, -116.84033203125, -114.34235382080078, -111.84437561035156, -109.34639739990234, -106.84841918945312, -104.35043334960938, -101.85245513916016, -99.35447692871094, -96.85649108886719, -94.35851287841797, -91.86053466796875, -89.36255645751953, -86.86457824707031, -84.36659240722656, -81.86861419677734, -79.37063598632812, -76.87265014648438, -74.37467193603516, -71.87669372558594, -69.37871551513672, -66.8807373046875, -64.38275146484375, -61.88477325439453, -59.38679504394531, -56.88881301879883, -54.390830993652344, -51.892852783203125, -49.394874572753906, -46.89689254760742, -44.39891052246094, -41.90092849731445, -39.40294647216797, -36.90496826171875, -34.40699005126953, -31.909008026123047, -29.411027908325195, -26.913047790527344, -24.415067672729492, -21.91708755493164, -19.41910743713379, -16.921127319335938, -14.423147201538086, -11.925167083740234, -9.427186965942383, -6.929206848144531, -4.43122673034668, -1.9332466125488281, 0.5647335052490234, 3.062713623046875, 5.560693740844727, 8.058673858642578, 10.55665397644043, 13.054634094238281, 15.552614212036133, 18.050594329833984, 20.548574447631836, 23.046554565429688, 25.54453468322754, 28.04251480102539, 30.540494918823242, 33.038475036621094, 35.53645324707031, 38.0344352722168]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 8.0, 2.0, 11.0, 13.0, 18.0, 17.0, 26.0, 22.0, 24.0, 21.0, 24.0, 32.0, 37.0, 36.0, 40.0, 54.0, 42.0, 48.0, 48.0, 55.0, 41.0, 49.0, 41.0, 30.0, 35.0, 23.0, 26.0, 22.0, 20.0, 17.0, 22.0, 23.0, 16.0, 10.0, 8.0, 10.0, 4.0, 2.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-23.685802459716797, -22.985179901123047, -22.284557342529297, -21.58393669128418, -20.88331413269043, -20.18269157409668, -19.482070922851562, -18.781448364257812, -18.080825805664062, -17.380203247070312, -16.679580688476562, -15.978960037231445, -15.278337478637695, -14.577714920043945, -13.877093315124512, -13.176471710205078, -12.475849151611328, -11.775226593017578, -11.074604988098145, -10.373983383178711, -9.673360824584961, -8.972738265991211, -8.272116661071777, -7.5714945793151855, -6.870872497558594, -6.170250415802002, -5.46962833404541, -4.769006252288818, -4.068384170532227, -3.3677620887756348, -2.667140007019043, -1.9665179252624512, -1.2658958435058594, -0.5652737617492676, 0.13534832000732422, 0.835970401763916, 1.5365924835205078, 2.2372145652770996, 2.9378366470336914, 3.638458728790283, 4.339080810546875, 5.039702892303467, 5.740324974060059, 6.44094705581665, 7.141569137573242, 7.842191219329834, 8.542813301086426, 9.24343490600586, 9.94405746459961, 10.64468002319336, 11.345301628112793, 12.045923233032227, 12.746545791625977, 13.447168350219727, 14.14778995513916, 14.848411560058594, 15.549034118652344, 16.249656677246094, 16.950279235839844, 17.65089988708496, 18.35152244567871, 19.05214500427246, 19.752765655517578, 20.453388214111328, 21.154010772705078]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 18.0, 39.0, 42.0, 135.0, 306.0, 801.0, 2818.0, 12663.0, 96119.0, 697303.0, 209791.0, 22262.0, 4227.0, 1191.0, 445.0, 166.0, 84.0, 53.0, 23.0, 15.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.16217041015625, -5.9219970703125, -5.68182373046875, -5.441650390625, -5.20147705078125, -4.9613037109375, -4.72113037109375, -4.48095703125, -4.24078369140625, -4.0006103515625, -3.76043701171875, -3.520263671875, -3.28009033203125, -3.0399169921875, -2.79974365234375, -2.5595703125, -2.31939697265625, -2.0792236328125, -1.83905029296875, -1.598876953125, -1.35870361328125, -1.1185302734375, -0.87835693359375, -0.63818359375, -0.39801025390625, -0.1578369140625, 0.08233642578125, 0.322509765625, 0.56268310546875, 0.8028564453125, 1.04302978515625, 1.283203125, 1.52337646484375, 1.7635498046875, 2.00372314453125, 2.243896484375, 2.48406982421875, 2.7242431640625, 2.96441650390625, 3.20458984375, 3.44476318359375, 3.6849365234375, 3.92510986328125, 4.165283203125, 4.40545654296875, 4.6456298828125, 4.88580322265625, 5.1259765625, 5.36614990234375, 5.6063232421875, 5.84649658203125, 6.086669921875, 6.32684326171875, 6.5670166015625, 6.80718994140625, 7.04736328125, 7.28753662109375, 7.5277099609375, 7.76788330078125, 8.008056640625, 8.24822998046875, 8.4884033203125, 8.72857666015625, 8.96875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 11.0, 17.0, 24.0, 27.0, 32.0, 45.0, 50.0, 66.0, 80.0, 84.0, 87.0, 69.0, 75.0, 66.0, 74.0, 48.0, 38.0, 32.0, 18.0, 15.0, 17.0, 4.0, 9.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6796875, -3.53668212890625, -3.3936767578125, -3.25067138671875, -3.107666015625, -2.96466064453125, -2.8216552734375, -2.67864990234375, -2.53564453125, -2.39263916015625, -2.2496337890625, -2.10662841796875, -1.963623046875, -1.82061767578125, -1.6776123046875, -1.53460693359375, -1.3916015625, -1.24859619140625, -1.1055908203125, -0.96258544921875, -0.819580078125, -0.67657470703125, -0.5335693359375, -0.39056396484375, -0.24755859375, -0.10455322265625, 0.0384521484375, 0.18145751953125, 0.324462890625, 0.46746826171875, 0.6104736328125, 0.75347900390625, 0.896484375, 1.03948974609375, 1.1824951171875, 1.32550048828125, 1.468505859375, 1.61151123046875, 1.7545166015625, 1.89752197265625, 2.04052734375, 2.18353271484375, 2.3265380859375, 2.46954345703125, 2.612548828125, 2.75555419921875, 2.8985595703125, 3.04156494140625, 3.1845703125, 3.32757568359375, 3.4705810546875, 3.61358642578125, 3.756591796875, 3.89959716796875, 4.0426025390625, 4.18560791015625, 4.32861328125, 4.47161865234375, 4.6146240234375, 4.75762939453125, 4.900634765625, 5.04364013671875, 5.1866455078125, 5.32965087890625, 5.47265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 12.0, 2.0, 10.0, 14.0, 19.0, 23.0, 24.0, 40.0, 58.0, 84.0, 107.0, 160.0, 238.0, 396.0, 741.0, 1718.0, 4666.0, 17705.0, 101457.0, 718093.0, 166600.0, 25624.0, 6335.0, 2209.0, 883.0, 457.0, 308.0, 160.0, 105.0, 71.0, 63.0, 48.0, 24.0, 29.0, 19.0, 19.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.681884765625, -6.47705078125, -6.272216796875, -6.0673828125, -5.862548828125, -5.65771484375, -5.452880859375, -5.248046875, -5.043212890625, -4.83837890625, -4.633544921875, -4.4287109375, -4.223876953125, -4.01904296875, -3.814208984375, -3.609375, -3.404541015625, -3.19970703125, -2.994873046875, -2.7900390625, -2.585205078125, -2.38037109375, -2.175537109375, -1.970703125, -1.765869140625, -1.56103515625, -1.356201171875, -1.1513671875, -0.946533203125, -0.74169921875, -0.536865234375, -0.33203125, -0.127197265625, 0.07763671875, 0.282470703125, 0.4873046875, 0.692138671875, 0.89697265625, 1.101806640625, 1.306640625, 1.511474609375, 1.71630859375, 1.921142578125, 2.1259765625, 2.330810546875, 2.53564453125, 2.740478515625, 2.9453125, 3.150146484375, 3.35498046875, 3.559814453125, 3.7646484375, 3.969482421875, 4.17431640625, 4.379150390625, 4.583984375, 4.788818359375, 4.99365234375, 5.198486328125, 5.4033203125, 5.608154296875, 5.81298828125, 6.017822265625, 6.22265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 3.0, 9.0, 7.0, 18.0, 9.0, 15.0, 18.0, 28.0, 16.0, 41.0, 36.0, 35.0, 51.0, 49.0, 54.0, 59.0, 57.0, 57.0, 49.0, 51.0, 38.0, 58.0, 38.0, 21.0, 36.0, 23.0, 9.0, 15.0, 13.0, 13.0, 9.0, 7.0, 4.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.0625, -10.70947265625, -10.3564453125, -10.00341796875, -9.650390625, -9.29736328125, -8.9443359375, -8.59130859375, -8.23828125, -7.88525390625, -7.5322265625, -7.17919921875, -6.826171875, -6.47314453125, -6.1201171875, -5.76708984375, -5.4140625, -5.06103515625, -4.7080078125, -4.35498046875, -4.001953125, -3.64892578125, -3.2958984375, -2.94287109375, -2.58984375, -2.23681640625, -1.8837890625, -1.53076171875, -1.177734375, -0.82470703125, -0.4716796875, -0.11865234375, 0.234375, 0.58740234375, 0.9404296875, 1.29345703125, 1.646484375, 1.99951171875, 2.3525390625, 2.70556640625, 3.05859375, 3.41162109375, 3.7646484375, 4.11767578125, 4.470703125, 4.82373046875, 5.1767578125, 5.52978515625, 5.8828125, 6.23583984375, 6.5888671875, 6.94189453125, 7.294921875, 7.64794921875, 8.0009765625, 8.35400390625, 8.70703125, 9.06005859375, 9.4130859375, 9.76611328125, 10.119140625, 10.47216796875, 10.8251953125, 11.17822265625, 11.53125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 4.0, 5.0, 14.0, 13.0, 21.0, 16.0, 26.0, 47.0, 48.0, 81.0, 101.0, 183.0, 293.0, 442.0, 725.0, 1151.0, 2055.0, 3910.0, 8026.0, 17129.0, 40295.0, 114260.0, 594677.0, 168858.0, 53851.0, 21737.0, 9698.0, 4805.0, 2486.0, 1352.0, 790.0, 475.0, 311.0, 223.0, 122.0, 82.0, 72.0, 46.0, 43.0, 20.0, 13.0, 12.0, 5.0, 5.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.623046875, -1.573333740234375, -1.52362060546875, -1.473907470703125, -1.4241943359375, -1.374481201171875, -1.32476806640625, -1.275054931640625, -1.225341796875, -1.175628662109375, -1.12591552734375, -1.076202392578125, -1.0264892578125, -0.976776123046875, -0.92706298828125, -0.877349853515625, -0.82763671875, -0.777923583984375, -0.72821044921875, -0.678497314453125, -0.6287841796875, -0.579071044921875, -0.52935791015625, -0.479644775390625, -0.429931640625, -0.380218505859375, -0.33050537109375, -0.280792236328125, -0.2310791015625, -0.181365966796875, -0.13165283203125, -0.081939697265625, -0.0322265625, 0.017486572265625, 0.06719970703125, 0.116912841796875, 0.1666259765625, 0.216339111328125, 0.26605224609375, 0.315765380859375, 0.365478515625, 0.415191650390625, 0.46490478515625, 0.514617919921875, 0.5643310546875, 0.614044189453125, 0.66375732421875, 0.713470458984375, 0.76318359375, 0.812896728515625, 0.86260986328125, 0.912322998046875, 0.9620361328125, 1.011749267578125, 1.06146240234375, 1.111175537109375, 1.160888671875, 1.210601806640625, 1.26031494140625, 1.310028076171875, 1.3597412109375, 1.409454345703125, 1.45916748046875, 1.508880615234375, 1.55859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 5.0, 2.0, 6.0, 7.0, 7.0, 12.0, 17.0, 23.0, 23.0, 38.0, 49.0, 76.0, 107.0, 136.0, 139.0, 98.0, 58.0, 46.0, 44.0, 13.0, 16.0, 16.0, 8.0, 10.0, 7.0, 2.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006804466247558594, -0.0006590709090232849, -0.0006376951932907104, -0.000616319477558136, -0.0005949437618255615, -0.0005735680460929871, -0.0005521923303604126, -0.0005308166146278381, -0.0005094408988952637, -0.0004880651831626892, -0.00046668946743011475, -0.0004453137516975403, -0.0004239380359649658, -0.00040256232023239136, -0.0003811866044998169, -0.00035981088876724243, -0.00033843517303466797, -0.0003170594573020935, -0.00029568374156951904, -0.0002743080258369446, -0.0002529323101043701, -0.00023155659437179565, -0.0002101808786392212, -0.00018880516290664673, -0.00016742944717407227, -0.0001460537314414978, -0.00012467801570892334, -0.00010330229997634888, -8.192658424377441e-05, -6.055086851119995e-05, -3.917515277862549e-05, -1.7799437046051025e-05, 3.5762786865234375e-06, 2.49519944190979e-05, 4.632771015167236e-05, 6.770342588424683e-05, 8.907914161682129e-05, 0.00011045485734939575, 0.00013183057308197021, 0.00015320628881454468, 0.00017458200454711914, 0.0001959577202796936, 0.00021733343601226807, 0.00023870915174484253, 0.000260084867477417, 0.00028146058320999146, 0.0003028362989425659, 0.0003242120146751404, 0.00034558773040771484, 0.0003669634461402893, 0.00038833916187286377, 0.00040971487760543823, 0.0004310905933380127, 0.00045246630907058716, 0.0004738420248031616, 0.0004952177405357361, 0.0005165934562683105, 0.000537969172000885, 0.0005593448877334595, 0.0005807206034660339, 0.0006020963191986084, 0.0006234720349311829, 0.0006448477506637573, 0.0006662234663963318, 0.0006875991821289062]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 7.0, 16.0, 29.0, 35.0, 53.0, 84.0, 135.0, 211.0, 364.0, 688.0, 1347.0, 2695.0, 6197.0, 16005.0, 47920.0, 197292.0, 635633.0, 94113.0, 27524.0, 9920.0, 4151.0, 1914.0, 905.0, 514.0, 268.0, 195.0, 101.0, 68.0, 43.0, 37.0, 21.0, 14.0, 8.0, 11.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.370269775390625, -2.30108642578125, -2.231903076171875, -2.1627197265625, -2.093536376953125, -2.02435302734375, -1.955169677734375, -1.885986328125, -1.816802978515625, -1.74761962890625, -1.678436279296875, -1.6092529296875, -1.540069580078125, -1.47088623046875, -1.401702880859375, -1.33251953125, -1.263336181640625, -1.19415283203125, -1.124969482421875, -1.0557861328125, -0.986602783203125, -0.91741943359375, -0.848236083984375, -0.779052734375, -0.709869384765625, -0.64068603515625, -0.571502685546875, -0.5023193359375, -0.433135986328125, -0.36395263671875, -0.294769287109375, -0.2255859375, -0.156402587890625, -0.08721923828125, -0.018035888671875, 0.0511474609375, 0.120330810546875, 0.18951416015625, 0.258697509765625, 0.327880859375, 0.397064208984375, 0.46624755859375, 0.535430908203125, 0.6046142578125, 0.673797607421875, 0.74298095703125, 0.812164306640625, 0.88134765625, 0.950531005859375, 1.01971435546875, 1.088897705078125, 1.1580810546875, 1.227264404296875, 1.29644775390625, 1.365631103515625, 1.434814453125, 1.503997802734375, 1.57318115234375, 1.642364501953125, 1.7115478515625, 1.780731201171875, 1.84991455078125, 1.919097900390625, 1.98828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 7.0, 5.0, 16.0, 9.0, 22.0, 16.0, 30.0, 35.0, 38.0, 48.0, 88.0, 100.0, 97.0, 95.0, 76.0, 69.0, 49.0, 45.0, 24.0, 20.0, 16.0, 20.0, 11.0, 15.0, 9.0, 9.0, 4.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.005859375, -1.93359375, -1.861328125, -1.7890625, -1.716796875, -1.64453125, -1.572265625, -1.5, -1.427734375, -1.35546875, -1.283203125, -1.2109375, -1.138671875, -1.06640625, -0.994140625, -0.921875, -0.849609375, -0.77734375, -0.705078125, -0.6328125, -0.560546875, -0.48828125, -0.416015625, -0.34375, -0.271484375, -0.19921875, -0.126953125, -0.0546875, 0.017578125, 0.08984375, 0.162109375, 0.234375, 0.306640625, 0.37890625, 0.451171875, 0.5234375, 0.595703125, 0.66796875, 0.740234375, 0.8125, 0.884765625, 0.95703125, 1.029296875, 1.1015625, 1.173828125, 1.24609375, 1.318359375, 1.390625, 1.462890625, 1.53515625, 1.607421875, 1.6796875, 1.751953125, 1.82421875, 1.896484375, 1.96875, 2.041015625, 2.11328125, 2.185546875, 2.2578125, 2.330078125, 2.40234375, 2.474609375, 2.546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 9.0, 17.0, 42.0, 90.0, 325.0, 297.0, 136.0, 50.0, 15.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.891357421875, -85.1408462524414, -82.39033508300781, -79.63982391357422, -76.88931274414062, -74.13880157470703, -71.38829040527344, -68.63778686523438, -65.88726806640625, -63.136756896972656, -60.38624572753906, -57.63573455810547, -54.885223388671875, -52.13471221923828, -49.38420486450195, -46.63369369506836, -43.88318634033203, -41.13267517089844, -38.382164001464844, -35.63165283203125, -32.881141662597656, -30.130632400512695, -27.380123138427734, -24.62961196899414, -21.879100799560547, -19.128589630126953, -16.37807846069336, -13.627569198608398, -10.877058029174805, -8.126546859741211, -5.37603759765625, -2.6255264282226562, 0.12497711181640625, 2.875487804412842, 5.625998497009277, 8.376508712768555, 11.127019882202148, 13.877531051635742, 16.628040313720703, 19.378551483154297, 22.12906265258789, 24.879573822021484, 27.630084991455078, 30.38059425354004, 33.131103515625, 35.881614685058594, 38.63212585449219, 41.38263702392578, 44.133148193359375, 46.88365936279297, 49.63417053222656, 52.384681701660156, 55.13519287109375, 57.885704040527344, 60.63621139526367, 63.386722564697266, 66.13723754882812, 68.88774871826172, 71.63825988769531, 74.3887710571289, 77.1392822265625, 79.8897933959961, 82.64030456542969, 85.39080810546875, 88.14131927490234]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 10.0, 7.0, 12.0, 14.0, 13.0, 16.0, 22.0, 17.0, 25.0, 18.0, 31.0, 27.0, 24.0, 31.0, 43.0, 63.0, 89.0, 85.0, 94.0, 48.0, 30.0, 26.0, 20.0, 20.0, 27.0, 28.0, 21.0, 25.0, 13.0, 21.0, 10.0, 5.0, 14.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-44.07929229736328, -42.7523307800293, -41.42536926269531, -40.09840774536133, -38.771446228027344, -37.444480895996094, -36.11751937866211, -34.790557861328125, -33.46359634399414, -32.136634826660156, -30.809673309326172, -29.482709884643555, -28.15574836730957, -26.828786849975586, -25.50182342529297, -24.174861907958984, -22.847900390625, -21.520938873291016, -20.19397735595703, -18.867013931274414, -17.54005241394043, -16.213090896606445, -14.886128425598145, -13.559165954589844, -12.23220443725586, -10.905242919921875, -9.578280448913574, -8.251317977905273, -6.924356460571289, -5.5973944664001465, -4.270432472229004, -2.943470001220703, -1.6165084838867188, -0.28954648971557617, 1.0374155044555664, 2.364377498626709, 3.6913394927978516, 5.018301486968994, 6.345263481140137, 7.6722259521484375, 8.999187469482422, 10.326148986816406, 11.653111457824707, 12.980073928833008, 14.307035446166992, 15.633996963500977, 16.960960388183594, 18.287921905517578, 19.614883422851562, 20.941844940185547, 22.26880645751953, 23.59576988220215, 24.922731399536133, 26.249692916870117, 27.576656341552734, 28.90361785888672, 30.230579376220703, 31.557540893554688, 32.88450241088867, 34.211463928222656, 35.538429260253906, 36.86539077758789, 38.192352294921875, 39.51931381225586, 40.846275329589844]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 5.0, 9.0, 15.0, 19.0, 18.0, 29.0, 34.0, 56.0, 51.0, 113.0, 191.0, 325.0, 615.0, 1264.0, 2784.0, 7661.0, 28149.0, 160520.0, 1366398.0, 2246997.0, 311114.0, 47172.0, 12208.0, 4355.0, 1954.0, 902.0, 516.0, 285.0, 160.0, 106.0, 84.0, 44.0, 45.0, 21.0, 20.0, 8.0, 12.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.89208984375, -4.7529296875, -4.61376953125, -4.474609375, -4.33544921875, -4.1962890625, -4.05712890625, -3.91796875, -3.77880859375, -3.6396484375, -3.50048828125, -3.361328125, -3.22216796875, -3.0830078125, -2.94384765625, -2.8046875, -2.66552734375, -2.5263671875, -2.38720703125, -2.248046875, -2.10888671875, -1.9697265625, -1.83056640625, -1.69140625, -1.55224609375, -1.4130859375, -1.27392578125, -1.134765625, -0.99560546875, -0.8564453125, -0.71728515625, -0.578125, -0.43896484375, -0.2998046875, -0.16064453125, -0.021484375, 0.11767578125, 0.2568359375, 0.39599609375, 0.53515625, 0.67431640625, 0.8134765625, 0.95263671875, 1.091796875, 1.23095703125, 1.3701171875, 1.50927734375, 1.6484375, 1.78759765625, 1.9267578125, 2.06591796875, 2.205078125, 2.34423828125, 2.4833984375, 2.62255859375, 2.76171875, 2.90087890625, 3.0400390625, 3.17919921875, 3.318359375, 3.45751953125, 3.5966796875, 3.73583984375, 3.875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 7.0, 6.0, 8.0, 17.0, 22.0, 17.0, 21.0, 31.0, 36.0, 28.0, 52.0, 40.0, 45.0, 39.0, 54.0, 41.0, 68.0, 42.0, 51.0, 50.0, 48.0, 43.0, 26.0, 33.0, 25.0, 28.0, 25.0, 21.0, 13.0, 17.0, 10.0, 7.0, 1.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2265625, -3.133056640625, -3.03955078125, -2.946044921875, -2.8525390625, -2.759033203125, -2.66552734375, -2.572021484375, -2.478515625, -2.385009765625, -2.29150390625, -2.197998046875, -2.1044921875, -2.010986328125, -1.91748046875, -1.823974609375, -1.73046875, -1.636962890625, -1.54345703125, -1.449951171875, -1.3564453125, -1.262939453125, -1.16943359375, -1.075927734375, -0.982421875, -0.888916015625, -0.79541015625, -0.701904296875, -0.6083984375, -0.514892578125, -0.42138671875, -0.327880859375, -0.234375, -0.140869140625, -0.04736328125, 0.046142578125, 0.1396484375, 0.233154296875, 0.32666015625, 0.420166015625, 0.513671875, 0.607177734375, 0.70068359375, 0.794189453125, 0.8876953125, 0.981201171875, 1.07470703125, 1.168212890625, 1.26171875, 1.355224609375, 1.44873046875, 1.542236328125, 1.6357421875, 1.729248046875, 1.82275390625, 1.916259765625, 2.009765625, 2.103271484375, 2.19677734375, 2.290283203125, 2.3837890625, 2.477294921875, 2.57080078125, 2.664306640625, 2.7578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 8.0, 12.0, 23.0, 20.0, 45.0, 83.0, 168.0, 341.0, 998.0, 4397.0, 46957.0, 3424162.0, 696541.0, 16830.0, 2432.0, 709.0, 255.0, 129.0, 66.0, 28.0, 15.0, 19.0, 8.0, 6.0, 6.0, 1.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.2244873046875, -12.855224609375, -12.4859619140625, -12.11669921875, -11.7474365234375, -11.378173828125, -11.0089111328125, -10.6396484375, -10.2703857421875, -9.901123046875, -9.5318603515625, -9.16259765625, -8.7933349609375, -8.424072265625, -8.0548095703125, -7.685546875, -7.3162841796875, -6.947021484375, -6.5777587890625, -6.20849609375, -5.8392333984375, -5.469970703125, -5.1007080078125, -4.7314453125, -4.3621826171875, -3.992919921875, -3.6236572265625, -3.25439453125, -2.8851318359375, -2.515869140625, -2.1466064453125, -1.77734375, -1.4080810546875, -1.038818359375, -0.6695556640625, -0.30029296875, 0.0689697265625, 0.438232421875, 0.8074951171875, 1.1767578125, 1.5460205078125, 1.915283203125, 2.2845458984375, 2.65380859375, 3.0230712890625, 3.392333984375, 3.7615966796875, 4.130859375, 4.5001220703125, 4.869384765625, 5.2386474609375, 5.60791015625, 5.9771728515625, 6.346435546875, 6.7156982421875, 7.0849609375, 7.4542236328125, 7.823486328125, 8.1927490234375, 8.56201171875, 8.9312744140625, 9.300537109375, 9.6697998046875, 10.0390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 10.0, 13.0, 25.0, 28.0, 62.0, 95.0, 112.0, 197.0, 337.0, 520.0, 712.0, 634.0, 489.0, 319.0, 161.0, 128.0, 63.0, 43.0, 30.0, 24.0, 12.0, 9.0, 13.0, 8.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.1380615234375, -5.924560546875, -5.7110595703125, -5.49755859375, -5.2840576171875, -5.070556640625, -4.8570556640625, -4.6435546875, -4.4300537109375, -4.216552734375, -4.0030517578125, -3.78955078125, -3.5760498046875, -3.362548828125, -3.1490478515625, -2.935546875, -2.7220458984375, -2.508544921875, -2.2950439453125, -2.08154296875, -1.8680419921875, -1.654541015625, -1.4410400390625, -1.2275390625, -1.0140380859375, -0.800537109375, -0.5870361328125, -0.37353515625, -0.1600341796875, 0.053466796875, 0.2669677734375, 0.48046875, 0.6939697265625, 0.907470703125, 1.1209716796875, 1.33447265625, 1.5479736328125, 1.761474609375, 1.9749755859375, 2.1884765625, 2.4019775390625, 2.615478515625, 2.8289794921875, 3.04248046875, 3.2559814453125, 3.469482421875, 3.6829833984375, 3.896484375, 4.1099853515625, 4.323486328125, 4.5369873046875, 4.75048828125, 4.9639892578125, 5.177490234375, 5.3909912109375, 5.6044921875, 5.8179931640625, 6.031494140625, 6.2449951171875, 6.45849609375, 6.6719970703125, 6.885498046875, 7.0989990234375, 7.3125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 11.0, 24.0, 87.0, 148.0, 268.0, 219.0, 132.0, 57.0, 20.0, 10.0, 8.0, 7.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.01286315917969, -41.247127532958984, -38.48139190673828, -35.715660095214844, -32.949920654296875, -30.184186935424805, -27.418453216552734, -24.65271759033203, -21.886981964111328, -19.121246337890625, -16.355510711669922, -13.589776992797852, -10.824041366577148, -8.058305740356445, -5.292572021484375, -2.526836395263672, 0.23889923095703125, 3.004634380340576, 5.770369529724121, 8.536104202270508, 11.301839828491211, 14.067575454711914, 16.833309173583984, 19.599044799804688, 22.36478042602539, 25.130516052246094, 27.896251678466797, 30.661985397338867, 33.42771911621094, 36.193458557128906, 38.959190368652344, 41.72492599487305, 44.49066162109375, 47.25639724731445, 50.022132873535156, 52.787864685058594, 55.55360412597656, 58.3193359375, 61.0850715637207, 63.850807189941406, 66.61654663085938, 69.38227844238281, 72.14801788330078, 74.91374969482422, 77.67948913574219, 80.44522094726562, 83.21095275878906, 85.97669219970703, 88.74242401123047, 91.5081558227539, 94.27389526367188, 97.03962707519531, 99.80536651611328, 102.57109832763672, 105.33683776855469, 108.10256958007812, 110.86830139160156, 113.634033203125, 116.39977264404297, 119.1655044555664, 121.93124389648438, 124.69697570800781, 127.46270751953125, 130.22845458984375, 132.9941864013672]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 9.0, 9.0, 16.0, 12.0, 15.0, 22.0, 30.0, 22.0, 32.0, 31.0, 32.0, 35.0, 35.0, 47.0, 51.0, 41.0, 50.0, 47.0, 35.0, 37.0, 50.0, 42.0, 38.0, 39.0, 36.0, 29.0, 24.0, 21.0, 24.0, 12.0, 15.0, 11.0, 11.0, 7.0, 8.0, 4.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-28.750947952270508, -27.919124603271484, -27.08730125427246, -26.255477905273438, -25.423656463623047, -24.59183120727539, -23.760009765625, -22.928186416625977, -22.096363067626953, -21.26453971862793, -20.432716369628906, -19.600893020629883, -18.76906967163086, -17.93724822998047, -17.105424880981445, -16.273601531982422, -15.441778182983398, -14.609954833984375, -13.778131484985352, -12.946309089660645, -12.114485740661621, -11.282662391662598, -10.45083999633789, -9.619016647338867, -8.787193298339844, -7.95536994934082, -7.123547077178955, -6.29172420501709, -5.459900856018066, -4.628077507019043, -3.7962546348571777, -2.9644317626953125, -2.132608413696289, -1.3007853031158447, -0.4689621925354004, 0.36286091804504395, 1.1946840286254883, 2.0265073776245117, 2.858330249786377, 3.690153121948242, 4.521976470947266, 5.353799819946289, 6.185622692108154, 7.0174455642700195, 7.849268913269043, 8.681092262268066, 9.512914657592773, 10.344738006591797, 11.17656135559082, 12.008384704589844, 12.840208053588867, 13.672030448913574, 14.503853797912598, 15.335677146911621, 16.167499542236328, 16.99932289123535, 17.831146240234375, 18.6629695892334, 19.494792938232422, 20.326616287231445, 21.15843963623047, 21.99026107788086, 22.822084426879883, 23.653907775878906, 24.48573112487793]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 12.0, 24.0, 25.0, 30.0, 94.0, 208.0, 427.0, 1026.0, 3038.0, 10944.0, 54065.0, 400733.0, 491622.0, 67627.0, 13054.0, 3474.0, 1179.0, 501.0, 201.0, 92.0, 57.0, 40.0, 22.0, 16.0, 9.0, 11.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98046875, -7.76513671875, -7.5498046875, -7.33447265625, -7.119140625, -6.90380859375, -6.6884765625, -6.47314453125, -6.2578125, -6.04248046875, -5.8271484375, -5.61181640625, -5.396484375, -5.18115234375, -4.9658203125, -4.75048828125, -4.53515625, -4.31982421875, -4.1044921875, -3.88916015625, -3.673828125, -3.45849609375, -3.2431640625, -3.02783203125, -2.8125, -2.59716796875, -2.3818359375, -2.16650390625, -1.951171875, -1.73583984375, -1.5205078125, -1.30517578125, -1.08984375, -0.87451171875, -0.6591796875, -0.44384765625, -0.228515625, -0.01318359375, 0.2021484375, 0.41748046875, 0.6328125, 0.84814453125, 1.0634765625, 1.27880859375, 1.494140625, 1.70947265625, 1.9248046875, 2.14013671875, 2.35546875, 2.57080078125, 2.7861328125, 3.00146484375, 3.216796875, 3.43212890625, 3.6474609375, 3.86279296875, 4.078125, 4.29345703125, 4.5087890625, 4.72412109375, 4.939453125, 5.15478515625, 5.3701171875, 5.58544921875, 5.80078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 9.0, 13.0, 19.0, 17.0, 29.0, 26.0, 43.0, 46.0, 65.0, 52.0, 61.0, 65.0, 66.0, 64.0, 55.0, 58.0, 69.0, 34.0, 43.0, 37.0, 30.0, 24.0, 18.0, 21.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69921875, -4.570159912109375, -4.44110107421875, -4.312042236328125, -4.1829833984375, -4.053924560546875, -3.92486572265625, -3.795806884765625, -3.666748046875, -3.537689208984375, -3.40863037109375, -3.279571533203125, -3.1505126953125, -3.021453857421875, -2.89239501953125, -2.763336181640625, -2.63427734375, -2.505218505859375, -2.37615966796875, -2.247100830078125, -2.1180419921875, -1.988983154296875, -1.85992431640625, -1.730865478515625, -1.601806640625, -1.472747802734375, -1.34368896484375, -1.214630126953125, -1.0855712890625, -0.956512451171875, -0.82745361328125, -0.698394775390625, -0.5693359375, -0.440277099609375, -0.31121826171875, -0.182159423828125, -0.0531005859375, 0.075958251953125, 0.20501708984375, 0.334075927734375, 0.463134765625, 0.592193603515625, 0.72125244140625, 0.850311279296875, 0.9793701171875, 1.108428955078125, 1.23748779296875, 1.366546630859375, 1.49560546875, 1.624664306640625, 1.75372314453125, 1.882781982421875, 2.0118408203125, 2.140899658203125, 2.26995849609375, 2.399017333984375, 2.528076171875, 2.657135009765625, 2.78619384765625, 2.915252685546875, 3.0443115234375, 3.173370361328125, 3.30242919921875, 3.431488037109375, 3.560546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 14.0, 22.0, 16.0, 27.0, 44.0, 57.0, 106.0, 161.0, 199.0, 394.0, 647.0, 1473.0, 3531.0, 12102.0, 71347.0, 773262.0, 155786.0, 20275.0, 5113.0, 1853.0, 882.0, 464.0, 228.0, 166.0, 106.0, 81.0, 54.0, 42.0, 23.0, 20.0, 19.0, 6.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.3359375, -7.09674072265625, -6.8575439453125, -6.61834716796875, -6.379150390625, -6.13995361328125, -5.9007568359375, -5.66156005859375, -5.42236328125, -5.18316650390625, -4.9439697265625, -4.70477294921875, -4.465576171875, -4.22637939453125, -3.9871826171875, -3.74798583984375, -3.5087890625, -3.26959228515625, -3.0303955078125, -2.79119873046875, -2.552001953125, -2.31280517578125, -2.0736083984375, -1.83441162109375, -1.59521484375, -1.35601806640625, -1.1168212890625, -0.87762451171875, -0.638427734375, -0.39923095703125, -0.1600341796875, 0.07916259765625, 0.318359375, 0.55755615234375, 0.7967529296875, 1.03594970703125, 1.275146484375, 1.51434326171875, 1.7535400390625, 1.99273681640625, 2.23193359375, 2.47113037109375, 2.7103271484375, 2.94952392578125, 3.188720703125, 3.42791748046875, 3.6671142578125, 3.90631103515625, 4.1455078125, 4.38470458984375, 4.6239013671875, 4.86309814453125, 5.102294921875, 5.34149169921875, 5.5806884765625, 5.81988525390625, 6.05908203125, 6.29827880859375, 6.5374755859375, 6.77667236328125, 7.015869140625, 7.25506591796875, 7.4942626953125, 7.73345947265625, 7.97265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 13.0, 8.0, 15.0, 20.0, 29.0, 30.0, 38.0, 57.0, 71.0, 68.0, 63.0, 81.0, 73.0, 79.0, 72.0, 55.0, 50.0, 42.0, 21.0, 24.0, 19.0, 17.0, 12.0, 11.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.125, -16.6015625, -16.078125, -15.5546875, -15.03125, -14.5078125, -13.984375, -13.4609375, -12.9375, -12.4140625, -11.890625, -11.3671875, -10.84375, -10.3203125, -9.796875, -9.2734375, -8.75, -8.2265625, -7.703125, -7.1796875, -6.65625, -6.1328125, -5.609375, -5.0859375, -4.5625, -4.0390625, -3.515625, -2.9921875, -2.46875, -1.9453125, -1.421875, -0.8984375, -0.375, 0.1484375, 0.671875, 1.1953125, 1.71875, 2.2421875, 2.765625, 3.2890625, 3.8125, 4.3359375, 4.859375, 5.3828125, 5.90625, 6.4296875, 6.953125, 7.4765625, 8.0, 8.5234375, 9.046875, 9.5703125, 10.09375, 10.6171875, 11.140625, 11.6640625, 12.1875, 12.7109375, 13.234375, 13.7578125, 14.28125, 14.8046875, 15.328125, 15.8515625, 16.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 11.0, 18.0, 15.0, 31.0, 43.0, 59.0, 132.0, 213.0, 536.0, 1411.0, 4638.0, 21381.0, 182797.0, 778839.0, 46248.0, 8486.0, 2227.0, 707.0, 337.0, 159.0, 95.0, 55.0, 29.0, 27.0, 10.0, 12.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.634765625, -3.537078857421875, -3.43939208984375, -3.341705322265625, -3.2440185546875, -3.146331787109375, -3.04864501953125, -2.950958251953125, -2.853271484375, -2.755584716796875, -2.65789794921875, -2.560211181640625, -2.4625244140625, -2.364837646484375, -2.26715087890625, -2.169464111328125, -2.07177734375, -1.974090576171875, -1.87640380859375, -1.778717041015625, -1.6810302734375, -1.583343505859375, -1.48565673828125, -1.387969970703125, -1.290283203125, -1.192596435546875, -1.09490966796875, -0.997222900390625, -0.8995361328125, -0.801849365234375, -0.70416259765625, -0.606475830078125, -0.5087890625, -0.411102294921875, -0.31341552734375, -0.215728759765625, -0.1180419921875, -0.020355224609375, 0.07733154296875, 0.175018310546875, 0.272705078125, 0.370391845703125, 0.46807861328125, 0.565765380859375, 0.6634521484375, 0.761138916015625, 0.85882568359375, 0.956512451171875, 1.05419921875, 1.151885986328125, 1.24957275390625, 1.347259521484375, 1.4449462890625, 1.542633056640625, 1.64031982421875, 1.738006591796875, 1.835693359375, 1.933380126953125, 2.03106689453125, 2.128753662109375, 2.2264404296875, 2.324127197265625, 2.42181396484375, 2.519500732421875, 2.6171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 0.0, 4.0, 10.0, 1.0, 8.0, 4.0, 6.0, 11.0, 8.0, 12.0, 21.0, 29.0, 32.0, 40.0, 68.0, 97.0, 134.0, 147.0, 91.0, 66.0, 56.0, 39.0, 19.0, 18.0, 18.0, 13.0, 6.0, 8.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005145072937011719, -0.0004939883947372437, -0.00047346949577331543, -0.0004529505968093872, -0.000432431697845459, -0.00041191279888153076, -0.00039139389991760254, -0.0003708750009536743, -0.0003503561019897461, -0.00032983720302581787, -0.00030931830406188965, -0.0002887994050979614, -0.0002682805061340332, -0.000247761607170105, -0.00022724270820617676, -0.00020672380924224854, -0.0001862049102783203, -0.0001656860113143921, -0.00014516711235046387, -0.00012464821338653564, -0.00010412931442260742, -8.36104154586792e-05, -6.309151649475098e-05, -4.2572617530822754e-05, -2.205371856689453e-05, -1.5348196029663086e-06, 1.8984079360961914e-05, 3.950297832489014e-05, 6.002187728881836e-05, 8.054077625274658e-05, 0.0001010596752166748, 0.00012157857418060303, 0.00014209747314453125, 0.00016261637210845947, 0.0001831352710723877, 0.00020365417003631592, 0.00022417306900024414, 0.00024469196796417236, 0.0002652108669281006, 0.0002857297658920288, 0.00030624866485595703, 0.00032676756381988525, 0.0003472864627838135, 0.0003678053617477417, 0.0003883242607116699, 0.00040884315967559814, 0.00042936205863952637, 0.0004498809576034546, 0.0004703998565673828, 0.000490918755531311, 0.0005114376544952393, 0.0005319565534591675, 0.0005524754524230957, 0.0005729943513870239, 0.0005935132503509521, 0.0006140321493148804, 0.0006345510482788086, 0.0006550699472427368, 0.000675588846206665, 0.0006961077451705933, 0.0007166266441345215, 0.0007371455430984497, 0.0007576644420623779, 0.0007781833410263062, 0.0007987022399902344]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 5.0, 11.0, 9.0, 13.0, 29.0, 26.0, 48.0, 57.0, 82.0, 138.0, 197.0, 305.0, 452.0, 791.0, 1437.0, 2776.0, 5754.0, 12820.0, 32735.0, 100976.0, 619332.0, 182703.0, 52236.0, 19125.0, 8037.0, 3821.0, 1914.0, 1034.0, 583.0, 354.0, 234.0, 144.0, 109.0, 66.0, 55.0, 35.0, 27.0, 16.0, 14.0, 10.0, 9.0, 8.0, 2.0, 1.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5224609375, -1.472900390625, -1.42333984375, -1.373779296875, -1.32421875, -1.274658203125, -1.22509765625, -1.175537109375, -1.1259765625, -1.076416015625, -1.02685546875, -0.977294921875, -0.927734375, -0.878173828125, -0.82861328125, -0.779052734375, -0.7294921875, -0.679931640625, -0.63037109375, -0.580810546875, -0.53125, -0.481689453125, -0.43212890625, -0.382568359375, -0.3330078125, -0.283447265625, -0.23388671875, -0.184326171875, -0.134765625, -0.085205078125, -0.03564453125, 0.013916015625, 0.0634765625, 0.113037109375, 0.16259765625, 0.212158203125, 0.26171875, 0.311279296875, 0.36083984375, 0.410400390625, 0.4599609375, 0.509521484375, 0.55908203125, 0.608642578125, 0.658203125, 0.707763671875, 0.75732421875, 0.806884765625, 0.8564453125, 0.906005859375, 0.95556640625, 1.005126953125, 1.0546875, 1.104248046875, 1.15380859375, 1.203369140625, 1.2529296875, 1.302490234375, 1.35205078125, 1.401611328125, 1.451171875, 1.500732421875, 1.55029296875, 1.599853515625, 1.6494140625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 6.0, 3.0, 10.0, 17.0, 8.0, 10.0, 16.0, 24.0, 22.0, 27.0, 22.0, 39.0, 39.0, 38.0, 49.0, 74.0, 86.0, 66.0, 59.0, 38.0, 36.0, 47.0, 33.0, 25.0, 35.0, 32.0, 14.0, 20.0, 14.0, 8.0, 5.0, 5.0, 10.0, 7.0, 13.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.3818359375, -1.335845947265625, -1.28985595703125, -1.243865966796875, -1.1978759765625, -1.151885986328125, -1.10589599609375, -1.059906005859375, -1.013916015625, -0.967926025390625, -0.92193603515625, -0.875946044921875, -0.8299560546875, -0.783966064453125, -0.73797607421875, -0.691986083984375, -0.64599609375, -0.600006103515625, -0.55401611328125, -0.508026123046875, -0.4620361328125, -0.416046142578125, -0.37005615234375, -0.324066162109375, -0.278076171875, -0.232086181640625, -0.18609619140625, -0.140106201171875, -0.0941162109375, -0.048126220703125, -0.00213623046875, 0.043853759765625, 0.08984375, 0.135833740234375, 0.18182373046875, 0.227813720703125, 0.2738037109375, 0.319793701171875, 0.36578369140625, 0.411773681640625, 0.457763671875, 0.503753662109375, 0.54974365234375, 0.595733642578125, 0.6417236328125, 0.687713623046875, 0.73370361328125, 0.779693603515625, 0.82568359375, 0.871673583984375, 0.91766357421875, 0.963653564453125, 1.0096435546875, 1.055633544921875, 1.10162353515625, 1.147613525390625, 1.193603515625, 1.239593505859375, 1.28558349609375, 1.331573486328125, 1.3775634765625, 1.423553466796875, 1.46954345703125, 1.515533447265625, 1.5615234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 8.0, 31.0, 92.0, 298.0, 431.0, 83.0, 25.0, 10.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.44937133789062, -132.5598602294922, -128.67034912109375, -124.78083801269531, -120.89132690429688, -117.00181579589844, -113.1123046875, -109.22279357910156, -105.33328247070312, -101.44377136230469, -97.55426025390625, -93.66474914550781, -89.77523803710938, -85.88572692871094, -81.9962158203125, -78.10670471191406, -74.21719360351562, -70.32768249511719, -66.43817138671875, -62.54866027832031, -58.659149169921875, -54.76963806152344, -50.880126953125, -46.99061584472656, -43.101104736328125, -39.21159362792969, -35.32208251953125, -31.432571411132812, -27.543060302734375, -23.653549194335938, -19.7640380859375, -15.874526977539062, -11.985008239746094, -8.095497131347656, -4.205986022949219, -0.31647491455078125, 3.5730361938476562, 7.462547302246094, 11.352058410644531, 15.241569519042969, 19.131080627441406, 23.020591735839844, 26.91010284423828, 30.79961395263672, 34.689125061035156, 38.578636169433594, 42.46814727783203, 46.35765838623047, 50.247169494628906, 54.136680603027344, 58.02619171142578, 61.91570281982422, 65.80521392822266, 69.6947250366211, 73.58423614501953, 77.47374725341797, 81.3632583618164, 85.25276947021484, 89.14228057861328, 93.03179168701172, 96.92130279541016, 100.8108139038086, 104.70032501220703, 108.58983612060547, 112.4793472290039]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 13.0, 17.0, 21.0, 24.0, 22.0, 24.0, 26.0, 34.0, 34.0, 31.0, 47.0, 140.0, 162.0, 80.0, 49.0, 31.0, 38.0, 40.0, 28.0, 31.0, 11.0, 20.0, 8.0, 13.0, 11.0, 8.0, 2.0, 3.0, 6.0, 4.0, 1.0, 2.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.35020446777344, -52.55244827270508, -50.75468826293945, -48.956932067871094, -47.159175872802734, -45.361419677734375, -43.56365966796875, -41.76590347290039, -39.96814727783203, -38.17039108276367, -36.37263107299805, -34.57487487792969, -32.77711868286133, -30.979360580444336, -29.181602478027344, -27.383846282958984, -25.586088180541992, -23.788330078125, -21.99057388305664, -20.19281578063965, -18.39505958557129, -16.597301483154297, -14.799544334411621, -13.001787185668945, -11.20403003692627, -9.406272888183594, -7.608515739440918, -5.810758113861084, -4.013000965118408, -2.215243339538574, -0.41748619079589844, 1.3802709579467773, 3.178028106689453, 4.975785255432129, 6.773542404174805, 8.571300506591797, 10.369056701660156, 12.166814804077148, 13.964571952819824, 15.7623291015625, 17.56008529663086, 19.35784339904785, 21.15559959411621, 22.953357696533203, 24.751113891601562, 26.548871994018555, 28.346630096435547, 30.144386291503906, 31.9421443939209, 33.73990249633789, 35.53765869140625, 37.33541488647461, 39.133174896240234, 40.930931091308594, 42.72868728637695, 44.52644348144531, 46.32420349121094, 48.1219596862793, 49.91971969604492, 51.71747589111328, 53.51523208618164, 55.31298828125, 57.110748291015625, 58.908504486083984, 60.706260681152344]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 6.0, 5.0, 8.0, 10.0, 9.0, 27.0, 17.0, 29.0, 48.0, 51.0, 73.0, 148.0, 233.0, 422.0, 983.0, 2161.0, 6542.0, 24438.0, 145661.0, 1357810.0, 2308633.0, 293064.0, 39570.0, 9122.0, 2890.0, 1145.0, 477.0, 271.0, 141.0, 95.0, 55.0, 49.0, 29.0, 12.0, 17.0, 12.0, 10.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.359375, -7.1304931640625, -6.901611328125, -6.6727294921875, -6.44384765625, -6.2149658203125, -5.986083984375, -5.7572021484375, -5.5283203125, -5.2994384765625, -5.070556640625, -4.8416748046875, -4.61279296875, -4.3839111328125, -4.155029296875, -3.9261474609375, -3.697265625, -3.4683837890625, -3.239501953125, -3.0106201171875, -2.78173828125, -2.5528564453125, -2.323974609375, -2.0950927734375, -1.8662109375, -1.6373291015625, -1.408447265625, -1.1795654296875, -0.95068359375, -0.7218017578125, -0.492919921875, -0.2640380859375, -0.03515625, 0.1937255859375, 0.422607421875, 0.6514892578125, 0.88037109375, 1.1092529296875, 1.338134765625, 1.5670166015625, 1.7958984375, 2.0247802734375, 2.253662109375, 2.4825439453125, 2.71142578125, 2.9403076171875, 3.169189453125, 3.3980712890625, 3.626953125, 3.8558349609375, 4.084716796875, 4.3135986328125, 4.54248046875, 4.7713623046875, 5.000244140625, 5.2291259765625, 5.4580078125, 5.6868896484375, 5.915771484375, 6.1446533203125, 6.37353515625, 6.6024169921875, 6.831298828125, 7.0601806640625, 7.2890625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 9.0, 19.0, 23.0, 14.0, 21.0, 27.0, 33.0, 37.0, 41.0, 49.0, 46.0, 46.0, 53.0, 48.0, 52.0, 45.0, 51.0, 39.0, 56.0, 49.0, 38.0, 28.0, 21.0, 22.0, 17.0, 19.0, 16.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.37835693359375, -2.2879638671875, -2.19757080078125, -2.107177734375, -2.01678466796875, -1.9263916015625, -1.83599853515625, -1.74560546875, -1.65521240234375, -1.5648193359375, -1.47442626953125, -1.384033203125, -1.29364013671875, -1.2032470703125, -1.11285400390625, -1.0224609375, -0.93206787109375, -0.8416748046875, -0.75128173828125, -0.660888671875, -0.57049560546875, -0.4801025390625, -0.38970947265625, -0.29931640625, -0.20892333984375, -0.1185302734375, -0.02813720703125, 0.062255859375, 0.15264892578125, 0.2430419921875, 0.33343505859375, 0.423828125, 0.51422119140625, 0.6046142578125, 0.69500732421875, 0.785400390625, 0.87579345703125, 0.9661865234375, 1.05657958984375, 1.14697265625, 1.23736572265625, 1.3277587890625, 1.41815185546875, 1.508544921875, 1.59893798828125, 1.6893310546875, 1.77972412109375, 1.8701171875, 1.96051025390625, 2.0509033203125, 2.14129638671875, 2.231689453125, 2.32208251953125, 2.4124755859375, 2.50286865234375, 2.59326171875, 2.68365478515625, 2.7740478515625, 2.86444091796875, 2.954833984375, 3.04522705078125, 3.1356201171875, 3.22601318359375, 3.31640625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 12.0, 23.0, 56.0, 157.0, 858.0, 8470.0, 4175066.0, 8529.0, 849.0, 159.0, 59.0, 15.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.3125, -56.1923828125, -54.072265625, -51.9521484375, -49.83203125, -47.7119140625, -45.591796875, -43.4716796875, -41.3515625, -39.2314453125, -37.111328125, -34.9912109375, -32.87109375, -30.7509765625, -28.630859375, -26.5107421875, -24.390625, -22.2705078125, -20.150390625, -18.0302734375, -15.91015625, -13.7900390625, -11.669921875, -9.5498046875, -7.4296875, -5.3095703125, -3.189453125, -1.0693359375, 1.05078125, 3.1708984375, 5.291015625, 7.4111328125, 9.53125, 11.6513671875, 13.771484375, 15.8916015625, 18.01171875, 20.1318359375, 22.251953125, 24.3720703125, 26.4921875, 28.6123046875, 30.732421875, 32.8525390625, 34.97265625, 37.0927734375, 39.212890625, 41.3330078125, 43.453125, 45.5732421875, 47.693359375, 49.8134765625, 51.93359375, 54.0537109375, 56.173828125, 58.2939453125, 60.4140625, 62.5341796875, 64.654296875, 66.7744140625, 68.89453125, 71.0146484375, 73.134765625, 75.2548828125, 77.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 18.0, 24.0, 74.0, 200.0, 567.0, 1418.0, 1114.0, 457.0, 127.0, 51.0, 16.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.15625, -39.261474609375, -38.36669921875, -37.471923828125, -36.5771484375, -35.682373046875, -34.78759765625, -33.892822265625, -32.998046875, -32.103271484375, -31.20849609375, -30.313720703125, -29.4189453125, -28.524169921875, -27.62939453125, -26.734619140625, -25.83984375, -24.945068359375, -24.05029296875, -23.155517578125, -22.2607421875, -21.365966796875, -20.47119140625, -19.576416015625, -18.681640625, -17.786865234375, -16.89208984375, -15.997314453125, -15.1025390625, -14.207763671875, -13.31298828125, -12.418212890625, -11.5234375, -10.628662109375, -9.73388671875, -8.839111328125, -7.9443359375, -7.049560546875, -6.15478515625, -5.260009765625, -4.365234375, -3.470458984375, -2.57568359375, -1.680908203125, -0.7861328125, 0.108642578125, 1.00341796875, 1.898193359375, 2.79296875, 3.687744140625, 4.58251953125, 5.477294921875, 6.3720703125, 7.266845703125, 8.16162109375, 9.056396484375, 9.951171875, 10.845947265625, 11.74072265625, 12.635498046875, 13.5302734375, 14.425048828125, 15.31982421875, 16.214599609375, 17.109375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 12.0, 12.0, 11.0, 12.0, 23.0, 32.0, 45.0, 69.0, 108.0, 161.0, 137.0, 127.0, 80.0, 50.0, 26.0, 25.0, 15.0, 11.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-121.10395050048828, -117.83964538574219, -114.5753402709961, -111.31103515625, -108.04672241210938, -104.78241729736328, -101.51811218261719, -98.2538070678711, -94.989501953125, -91.7251968383789, -88.46089172363281, -85.19657897949219, -81.9322738647461, -78.66796875, -75.4036636352539, -72.13935852050781, -68.87504577636719, -65.6107406616211, -62.346431732177734, -59.08212661743164, -55.81781768798828, -52.55351257324219, -49.289207458496094, -46.02490234375, -42.76059341430664, -39.49628829956055, -36.23197937011719, -32.967674255371094, -29.703367233276367, -26.43906021118164, -23.174755096435547, -19.91044807434082, -16.646141052246094, -13.381834030151367, -10.117527961730957, -6.853221893310547, -3.5889148712158203, -0.32460784912109375, 2.939697265625, 6.204004287719727, 9.468311309814453, 12.73261833190918, 15.99692440032959, 19.26123046875, 22.525537490844727, 25.789844512939453, 29.054149627685547, 32.318458557128906, 35.582763671875, 38.847068786621094, 42.11137771606445, 45.37568283081055, 48.639991760253906, 51.904296875, 55.168601989746094, 58.43290710449219, 61.69721603393555, 64.9615249633789, 68.225830078125, 71.4901351928711, 74.75444030761719, 78.01875305175781, 81.28305053710938, 84.54736328125, 87.8116683959961]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 10.0, 17.0, 20.0, 27.0, 28.0, 36.0, 62.0, 63.0, 91.0, 97.0, 69.0, 86.0, 66.0, 50.0, 45.0, 47.0, 36.0, 33.0, 27.0, 13.0, 10.0, 14.0, 6.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.84820556640625, -81.82169342041016, -78.79518127441406, -75.76866912841797, -72.74215698242188, -69.71565246582031, -66.68913269042969, -63.662628173828125, -60.63611602783203, -57.60960388183594, -54.583091735839844, -51.55657958984375, -48.53007125854492, -45.50355911254883, -42.477046966552734, -39.450538635253906, -36.42402267456055, -33.39751052856445, -30.371000289916992, -27.3444881439209, -24.317977905273438, -21.291465759277344, -18.26495361328125, -15.238443374633789, -12.211931228637695, -9.185420036315918, -6.158908367156982, -3.132396697998047, -0.10588550567626953, 2.920625686645508, 5.947137832641602, 8.973648071289062, 12.000160217285156, 15.026671409606934, 18.05318260192871, 21.079694747924805, 24.106204986572266, 27.13271713256836, 30.159229278564453, 33.18573760986328, 36.212249755859375, 39.23876190185547, 42.26527404785156, 45.291786193847656, 48.318294525146484, 51.34480667114258, 54.37131881713867, 57.3978271484375, 60.42434310913086, 63.45085525512695, 66.47736358642578, 69.50387573242188, 72.53038787841797, 75.55690002441406, 78.58341217041016, 81.60992431640625, 84.63643646240234, 87.66294860839844, 90.68946075439453, 93.71597290039062, 96.74248504638672, 99.76899719238281, 102.79550170898438, 105.82201385498047, 108.84852600097656]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 12.0, 10.0, 14.0, 11.0, 25.0, 34.0, 53.0, 73.0, 141.0, 214.0, 396.0, 706.0, 1394.0, 2905.0, 6940.0, 18429.0, 59803.0, 256230.0, 525611.0, 122742.0, 32786.0, 11121.0, 4459.0, 2083.0, 1010.0, 559.0, 317.0, 184.0, 98.0, 80.0, 37.0, 33.0, 21.0, 7.0, 7.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5703125, -5.38623046875, -5.2021484375, -5.01806640625, -4.833984375, -4.64990234375, -4.4658203125, -4.28173828125, -4.09765625, -3.91357421875, -3.7294921875, -3.54541015625, -3.361328125, -3.17724609375, -2.9931640625, -2.80908203125, -2.625, -2.44091796875, -2.2568359375, -2.07275390625, -1.888671875, -1.70458984375, -1.5205078125, -1.33642578125, -1.15234375, -0.96826171875, -0.7841796875, -0.60009765625, -0.416015625, -0.23193359375, -0.0478515625, 0.13623046875, 0.3203125, 0.50439453125, 0.6884765625, 0.87255859375, 1.056640625, 1.24072265625, 1.4248046875, 1.60888671875, 1.79296875, 1.97705078125, 2.1611328125, 2.34521484375, 2.529296875, 2.71337890625, 2.8974609375, 3.08154296875, 3.265625, 3.44970703125, 3.6337890625, 3.81787109375, 4.001953125, 4.18603515625, 4.3701171875, 4.55419921875, 4.73828125, 4.92236328125, 5.1064453125, 5.29052734375, 5.474609375, 5.65869140625, 5.8427734375, 6.02685546875, 6.2109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 5.0, 6.0, 10.0, 6.0, 12.0, 10.0, 15.0, 20.0, 15.0, 28.0, 27.0, 37.0, 46.0, 33.0, 41.0, 56.0, 37.0, 58.0, 59.0, 56.0, 46.0, 38.0, 48.0, 44.0, 39.0, 40.0, 33.0, 25.0, 21.0, 22.0, 17.0, 9.0, 6.0, 7.0, 8.0, 2.0, 4.0, 5.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.5234375, -4.38067626953125, -4.2379150390625, -4.09515380859375, -3.952392578125, -3.80963134765625, -3.6668701171875, -3.52410888671875, -3.38134765625, -3.23858642578125, -3.0958251953125, -2.95306396484375, -2.810302734375, -2.66754150390625, -2.5247802734375, -2.38201904296875, -2.2392578125, -2.09649658203125, -1.9537353515625, -1.81097412109375, -1.668212890625, -1.52545166015625, -1.3826904296875, -1.23992919921875, -1.09716796875, -0.95440673828125, -0.8116455078125, -0.66888427734375, -0.526123046875, -0.38336181640625, -0.2406005859375, -0.09783935546875, 0.044921875, 0.18768310546875, 0.3304443359375, 0.47320556640625, 0.615966796875, 0.75872802734375, 0.9014892578125, 1.04425048828125, 1.18701171875, 1.32977294921875, 1.4725341796875, 1.61529541015625, 1.758056640625, 1.90081787109375, 2.0435791015625, 2.18634033203125, 2.3291015625, 2.47186279296875, 2.6146240234375, 2.75738525390625, 2.900146484375, 3.04290771484375, 3.1856689453125, 3.32843017578125, 3.47119140625, 3.61395263671875, 3.7567138671875, 3.89947509765625, 4.042236328125, 4.18499755859375, 4.3277587890625, 4.47052001953125, 4.61328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 6.0, 16.0, 10.0, 26.0, 27.0, 45.0, 63.0, 101.0, 167.0, 366.0, 745.0, 2539.0, 13903.0, 296907.0, 711181.0, 17780.0, 2951.0, 836.0, 367.0, 208.0, 95.0, 67.0, 45.0, 22.0, 18.0, 11.0, 13.0, 6.0, 4.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.940185546875, -8.58349609375, -8.226806640625, -7.8701171875, -7.513427734375, -7.15673828125, -6.800048828125, -6.443359375, -6.086669921875, -5.72998046875, -5.373291015625, -5.0166015625, -4.659912109375, -4.30322265625, -3.946533203125, -3.58984375, -3.233154296875, -2.87646484375, -2.519775390625, -2.1630859375, -1.806396484375, -1.44970703125, -1.093017578125, -0.736328125, -0.379638671875, -0.02294921875, 0.333740234375, 0.6904296875, 1.047119140625, 1.40380859375, 1.760498046875, 2.1171875, 2.473876953125, 2.83056640625, 3.187255859375, 3.5439453125, 3.900634765625, 4.25732421875, 4.614013671875, 4.970703125, 5.327392578125, 5.68408203125, 6.040771484375, 6.3974609375, 6.754150390625, 7.11083984375, 7.467529296875, 7.82421875, 8.180908203125, 8.53759765625, 8.894287109375, 9.2509765625, 9.607666015625, 9.96435546875, 10.321044921875, 10.677734375, 11.034423828125, 11.39111328125, 11.747802734375, 12.1044921875, 12.461181640625, 12.81787109375, 13.174560546875, 13.53125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 9.0, 8.0, 8.0, 6.0, 14.0, 21.0, 20.0, 19.0, 12.0, 17.0, 18.0, 32.0, 38.0, 45.0, 36.0, 66.0, 91.0, 81.0, 88.0, 57.0, 54.0, 47.0, 33.0, 27.0, 30.0, 21.0, 11.0, 13.0, 18.0, 8.0, 12.0, 5.0, 7.0, 8.0, 6.0, 4.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.25, -18.6982421875, -18.146484375, -17.5947265625, -17.04296875, -16.4912109375, -15.939453125, -15.3876953125, -14.8359375, -14.2841796875, -13.732421875, -13.1806640625, -12.62890625, -12.0771484375, -11.525390625, -10.9736328125, -10.421875, -9.8701171875, -9.318359375, -8.7666015625, -8.21484375, -7.6630859375, -7.111328125, -6.5595703125, -6.0078125, -5.4560546875, -4.904296875, -4.3525390625, -3.80078125, -3.2490234375, -2.697265625, -2.1455078125, -1.59375, -1.0419921875, -0.490234375, 0.0615234375, 0.61328125, 1.1650390625, 1.716796875, 2.2685546875, 2.8203125, 3.3720703125, 3.923828125, 4.4755859375, 5.02734375, 5.5791015625, 6.130859375, 6.6826171875, 7.234375, 7.7861328125, 8.337890625, 8.8896484375, 9.44140625, 9.9931640625, 10.544921875, 11.0966796875, 11.6484375, 12.2001953125, 12.751953125, 13.3037109375, 13.85546875, 14.4072265625, 14.958984375, 15.5107421875, 16.0625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 5.0, 7.0, 13.0, 10.0, 17.0, 25.0, 48.0, 59.0, 115.0, 169.0, 323.0, 608.0, 1325.0, 3122.0, 9334.0, 42332.0, 850191.0, 114736.0, 17291.0, 5004.0, 1883.0, 854.0, 432.0, 233.0, 162.0, 89.0, 62.0, 34.0, 24.0, 12.0, 13.0, 5.0, 9.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7919921875, -1.7372283935546875, -1.682464599609375, -1.6277008056640625, -1.57293701171875, -1.5181732177734375, -1.463409423828125, -1.4086456298828125, -1.3538818359375, -1.2991180419921875, -1.244354248046875, -1.1895904541015625, -1.13482666015625, -1.0800628662109375, -1.025299072265625, -0.9705352783203125, -0.915771484375, -0.8610076904296875, -0.806243896484375, -0.7514801025390625, -0.69671630859375, -0.6419525146484375, -0.587188720703125, -0.5324249267578125, -0.4776611328125, -0.4228973388671875, -0.368133544921875, -0.3133697509765625, -0.25860595703125, -0.2038421630859375, -0.149078369140625, -0.0943145751953125, -0.03955078125, 0.0152130126953125, 0.069976806640625, 0.1247406005859375, 0.17950439453125, 0.2342681884765625, 0.289031982421875, 0.3437957763671875, 0.3985595703125, 0.4533233642578125, 0.508087158203125, 0.5628509521484375, 0.61761474609375, 0.6723785400390625, 0.727142333984375, 0.7819061279296875, 0.836669921875, 0.8914337158203125, 0.946197509765625, 1.0009613037109375, 1.05572509765625, 1.1104888916015625, 1.165252685546875, 1.2200164794921875, 1.2747802734375, 1.3295440673828125, 1.384307861328125, 1.4390716552734375, 1.49383544921875, 1.5485992431640625, 1.603363037109375, 1.6581268310546875, 1.712890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 7.0, 12.0, 14.0, 26.0, 23.0, 36.0, 68.0, 143.0, 185.0, 165.0, 113.0, 51.0, 36.0, 25.0, 17.0, 14.0, 10.0, 10.0, 10.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00055694580078125, -0.0005376413464546204, -0.0005183368921279907, -0.0004990324378013611, -0.00047972798347473145, -0.0004604235291481018, -0.00044111907482147217, -0.00042181462049484253, -0.0004025101661682129, -0.00038320571184158325, -0.0003639012575149536, -0.000344596803188324, -0.00032529234886169434, -0.0003059878945350647, -0.00028668344020843506, -0.0002673789858818054, -0.0002480745315551758, -0.00022877007722854614, -0.0002094656229019165, -0.00019016116857528687, -0.00017085671424865723, -0.0001515522599220276, -0.00013224780559539795, -0.00011294335126876831, -9.363889694213867e-05, -7.433444261550903e-05, -5.5029988288879395e-05, -3.5725533962249756e-05, -1.6421079635620117e-05, 2.8833746910095215e-06, 2.218782901763916e-05, 4.14922833442688e-05, 6.079673767089844e-05, 8.010119199752808e-05, 9.940564632415771e-05, 0.00011871010065078735, 0.000138014554977417, 0.00015731900930404663, 0.00017662346363067627, 0.0001959279179573059, 0.00021523237228393555, 0.00023453682661056519, 0.0002538412809371948, 0.00027314573526382446, 0.0002924501895904541, 0.00031175464391708374, 0.0003310590982437134, 0.000350363552570343, 0.00036966800689697266, 0.0003889724612236023, 0.00040827691555023193, 0.00042758136987686157, 0.0004468858242034912, 0.00046619027853012085, 0.0004854947328567505, 0.0005047991871833801, 0.0005241036415100098, 0.0005434080958366394, 0.000562712550163269, 0.0005820170044898987, 0.0006013214588165283, 0.000620625913143158, 0.0006399303674697876, 0.0006592348217964172, 0.0006785392761230469]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 14.0, 19.0, 20.0, 32.0, 63.0, 89.0, 198.0, 378.0, 698.0, 1491.0, 3859.0, 10861.0, 38779.0, 745766.0, 204375.0, 27876.0, 8284.0, 3086.0, 1290.0, 570.0, 330.0, 176.0, 96.0, 61.0, 36.0, 25.0, 19.0, 13.0, 12.0, 7.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.541015625, -1.485748291015625, -1.43048095703125, -1.375213623046875, -1.3199462890625, -1.264678955078125, -1.20941162109375, -1.154144287109375, -1.098876953125, -1.043609619140625, -0.98834228515625, -0.933074951171875, -0.8778076171875, -0.822540283203125, -0.76727294921875, -0.712005615234375, -0.65673828125, -0.601470947265625, -0.54620361328125, -0.490936279296875, -0.4356689453125, -0.380401611328125, -0.32513427734375, -0.269866943359375, -0.214599609375, -0.159332275390625, -0.10406494140625, -0.048797607421875, 0.0064697265625, 0.061737060546875, 0.11700439453125, 0.172271728515625, 0.2275390625, 0.282806396484375, 0.33807373046875, 0.393341064453125, 0.4486083984375, 0.503875732421875, 0.55914306640625, 0.614410400390625, 0.669677734375, 0.724945068359375, 0.78021240234375, 0.835479736328125, 0.8907470703125, 0.946014404296875, 1.00128173828125, 1.056549072265625, 1.11181640625, 1.167083740234375, 1.22235107421875, 1.277618408203125, 1.3328857421875, 1.388153076171875, 1.44342041015625, 1.498687744140625, 1.553955078125, 1.609222412109375, 1.66448974609375, 1.719757080078125, 1.7750244140625, 1.830291748046875, 1.88555908203125, 1.940826416015625, 1.99609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 9.0, 9.0, 11.0, 10.0, 14.0, 9.0, 14.0, 21.0, 26.0, 35.0, 54.0, 66.0, 91.0, 116.0, 111.0, 101.0, 60.0, 45.0, 30.0, 28.0, 24.0, 17.0, 15.0, 13.0, 12.0, 13.0, 7.0, 6.0, 7.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.8984375, -1.8391265869140625, -1.779815673828125, -1.7205047607421875, -1.66119384765625, -1.6018829345703125, -1.542572021484375, -1.4832611083984375, -1.4239501953125, -1.3646392822265625, -1.305328369140625, -1.2460174560546875, -1.18670654296875, -1.1273956298828125, -1.068084716796875, -1.0087738037109375, -0.949462890625, -0.8901519775390625, -0.830841064453125, -0.7715301513671875, -0.71221923828125, -0.6529083251953125, -0.593597412109375, -0.5342864990234375, -0.4749755859375, -0.4156646728515625, -0.356353759765625, -0.2970428466796875, -0.23773193359375, -0.1784210205078125, -0.119110107421875, -0.0597991943359375, -0.00048828125, 0.0588226318359375, 0.118133544921875, 0.1774444580078125, 0.23675537109375, 0.2960662841796875, 0.355377197265625, 0.4146881103515625, 0.4739990234375, 0.5333099365234375, 0.592620849609375, 0.6519317626953125, 0.71124267578125, 0.7705535888671875, 0.829864501953125, 0.8891754150390625, 0.948486328125, 1.0077972412109375, 1.067108154296875, 1.1264190673828125, 1.18572998046875, 1.2450408935546875, 1.304351806640625, 1.3636627197265625, 1.4229736328125, 1.4822845458984375, 1.541595458984375, 1.6009063720703125, 1.66021728515625, 1.7195281982421875, 1.778839111328125, 1.8381500244140625, 1.8974609375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 14.0, 47.0, 279.0, 543.0, 78.0, 29.0, 12.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.1165313720703, -169.66519165039062, -164.2138671875, -158.7625274658203, -153.3112030029297, -147.85986328125, -142.40853881835938, -136.9571990966797, -131.505859375, -126.05452728271484, -120.60319519042969, -115.15185546875, -109.70053100585938, -104.24919128417969, -98.79785919189453, -93.34652709960938, -87.89520263671875, -82.4438705444336, -76.99253845214844, -71.54119873046875, -66.08987426757812, -60.6385383605957, -55.18720245361328, -49.735870361328125, -44.28453826904297, -38.83320617675781, -33.381874084472656, -27.930538177490234, -22.479206085205078, -17.027873992919922, -11.5765380859375, -6.125205993652344, -0.673858642578125, 4.777474403381348, 10.22880744934082, 15.68014144897461, 21.131473541259766, 26.582805633544922, 32.034141540527344, 37.4854736328125, 42.936805725097656, 48.38813781738281, 53.83946990966797, 59.29080581665039, 64.74214172363281, 70.19346618652344, 75.64480590820312, 81.09613800048828, 86.54747009277344, 91.9988021850586, 97.45013427734375, 102.90147399902344, 108.35279846191406, 113.80413818359375, 119.2554702758789, 124.70680236816406, 130.15814208984375, 135.60948181152344, 141.06080627441406, 146.51214599609375, 151.96347045898438, 157.41481018066406, 162.86614990234375, 168.31747436523438, 173.768798828125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 8.0, 6.0, 6.0, 7.0, 8.0, 22.0, 19.0, 23.0, 29.0, 32.0, 28.0, 102.0, 175.0, 196.0, 104.0, 29.0, 26.0, 24.0, 27.0, 16.0, 24.0, 18.0, 14.0, 12.0, 16.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.95697021484375, -62.9290657043457, -60.901161193847656, -58.87325668334961, -56.84535217285156, -54.817447662353516, -52.78954315185547, -50.761634826660156, -48.733734130859375, -46.70582962036133, -44.67792510986328, -42.650020599365234, -40.62211608886719, -38.59421157836914, -36.566307067871094, -34.53839874267578, -32.510494232177734, -30.482589721679688, -28.45468521118164, -26.426780700683594, -24.398876190185547, -22.3709716796875, -20.34306526184082, -18.315160751342773, -16.287256240844727, -14.25935173034668, -12.231447219848633, -10.20354175567627, -8.175637245178223, -6.147732734680176, -4.1198272705078125, -2.0919227600097656, -0.06401824951171875, 1.9638864994049072, 3.991791248321533, 6.019696235656738, 8.047600746154785, 10.075505256652832, 12.103410720825195, 14.131315231323242, 16.15921974182129, 18.187124252319336, 20.215028762817383, 22.242935180664062, 24.27083969116211, 26.298744201660156, 28.326648712158203, 30.35455322265625, 32.3824577331543, 34.410362243652344, 36.43826675415039, 38.46617126464844, 40.494075775146484, 42.52198028564453, 44.549888610839844, 46.577789306640625, 48.60569763183594, 50.633602142333984, 52.66150665283203, 54.68941116333008, 56.717315673828125, 58.74522018432617, 60.77312469482422, 62.80103302001953, 64.82893371582031]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 8.0, 7.0, 20.0, 23.0, 23.0, 18.0, 38.0, 27.0, 45.0, 38.0, 65.0, 169.0, 182.0, 65.0, 43.0, 28.0, 34.0, 25.0, 26.0, 21.0, 14.0, 14.0, 7.0, 9.0, 2.0, 12.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.55078125, -5.3875732421875, -5.224365234375, -5.0611572265625, -4.89794921875, -4.7347412109375, -4.571533203125, -4.4083251953125, -4.2451171875, -4.0819091796875, -3.918701171875, -3.7554931640625, -3.59228515625, -3.4290771484375, -3.265869140625, -3.1026611328125, -2.939453125, -2.7762451171875, -2.613037109375, -2.4498291015625, -2.28662109375, -2.1234130859375, -1.960205078125, -1.7969970703125, -1.6337890625, -1.4705810546875, -1.307373046875, -1.1441650390625, -0.98095703125, -0.8177490234375, -0.654541015625, -0.4913330078125, -0.328125, -0.1649169921875, -0.001708984375, 0.1614990234375, 0.32470703125, 0.4879150390625, 0.651123046875, 0.8143310546875, 0.9775390625, 1.1407470703125, 1.303955078125, 1.4671630859375, 1.63037109375, 1.7935791015625, 1.956787109375, 2.1199951171875, 2.283203125, 2.4464111328125, 2.609619140625, 2.7728271484375, 2.93603515625, 3.0992431640625, 3.262451171875, 3.4256591796875, 3.5888671875, 3.7520751953125, 3.915283203125, 4.0784912109375, 4.24169921875, 4.4049072265625, 4.568115234375, 4.7313232421875, 4.89453125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 4.0, 4.0, 11.0, 6.0, 10.0, 10.0, 20.0, 26.0, 37.0, 70.0, 133.0, 244.0, 550.0, 2244.0, 16168.0, 8350882.0, 14869.0, 2105.0, 614.0, 236.0, 117.0, 52.0, 46.0, 27.0, 20.0, 9.0, 10.0, 6.0, 9.0, 11.0, 7.0, 4.0, 9.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-51.43772888183594, -50.06536102294922, -48.6929931640625, -47.32062530517578, -45.94825744628906, -44.575889587402344, -43.203521728515625, -41.831153869628906, -40.45878601074219, -39.08641815185547, -37.71405029296875, -36.34168243408203, -34.96931457519531, -33.596946716308594, -32.224578857421875, -30.85221290588379, -29.479846954345703, -28.107479095458984, -26.735111236572266, -25.362743377685547, -23.990375518798828, -22.61800765991211, -21.245641708374023, -19.873273849487305, -18.500905990600586, -17.128538131713867, -15.756170272827148, -14.383803367614746, -13.011435508728027, -11.639067649841309, -10.266700744628906, -8.894332885742188, -7.521961212158203, -6.149593353271484, -4.777225971221924, -3.4048585891723633, -2.0324907302856445, -0.6601228713989258, 0.7122440338134766, 2.0846118927001953, 3.456979751586914, 4.829347610473633, 6.201714992523193, 7.574082374572754, 8.946450233459473, 10.318818092346191, 11.691184997558594, 13.063552856445312, 14.435920715332031, 15.80828857421875, 17.18065643310547, 18.553024291992188, 19.925392150878906, 21.297760009765625, 22.67012596130371, 24.04249382019043, 25.41486167907715, 26.787229537963867, 28.159597396850586, 29.531963348388672, 30.90433120727539, 32.27669906616211, 33.64906692504883, 35.02143478393555, 36.393802642822266]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 5.0, 6.0, 4.0, 5.0, 2.0, 7.0, 3.0, 5.0, 3.0, 3.0, 6.0, 11.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.69510650634766, -66.27449035644531, -63.85386657714844, -61.43324661254883, -59.01262664794922, -56.59200668334961, -54.17138671875, -51.75076675415039, -49.33014678955078, -46.90952682495117, -44.48890686035156, -42.06828689575195, -39.647666931152344, -37.227046966552734, -34.806427001953125, -32.385807037353516, -29.965187072753906, -27.544567108154297, -25.123947143554688, -22.703327178955078, -20.28270721435547, -17.86208724975586, -15.44146728515625, -13.02084732055664, -10.600227355957031, -8.179607391357422, -5.7589874267578125, -3.338367462158203, -0.9177474975585938, 1.5028724670410156, 3.923492431640625, 6.344112396240234, 8.764739990234375, 11.185359954833984, 13.605979919433594, 16.026599884033203, 18.447219848632812, 20.867839813232422, 23.28845977783203, 25.70907974243164, 28.12969970703125, 30.55031967163086, 32.97093963623047, 35.39155960083008, 37.81217956542969, 40.2327995300293, 42.653419494628906, 45.074039459228516, 47.494659423828125, 49.915279388427734, 52.335899353027344, 54.75651931762695, 57.17713928222656, 59.59775924682617, 62.01837921142578, 64.43899536132812, 66.859619140625, 69.28024291992188, 71.70085906982422, 74.12147521972656, 76.54209899902344, 78.96272277832031, 81.38333892822266, 83.803955078125, 86.22457885742188]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 11.0, 8.0, 8.0, 12.0, 24.0, 21.0, 29.0, 25.0, 41.0, 41.0, 58.0, 58.0, 60.0, 70.0, 79.0, 54.0, 43.0, 69.0, 47.0, 41.0, 44.0, 26.0, 22.0, 16.0, 18.0, 18.0, 13.0, 4.0, 5.0, 7.0, 3.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.306640625, -3.202789306640625, -3.09893798828125, -2.995086669921875, -2.8912353515625, -2.787384033203125, -2.68353271484375, -2.579681396484375, -2.475830078125, -2.371978759765625, -2.26812744140625, -2.164276123046875, -2.0604248046875, -1.956573486328125, -1.85272216796875, -1.748870849609375, -1.64501953125, -1.541168212890625, -1.43731689453125, -1.333465576171875, -1.2296142578125, -1.125762939453125, -1.02191162109375, -0.918060302734375, -0.814208984375, -0.710357666015625, -0.60650634765625, -0.502655029296875, -0.3988037109375, -0.294952392578125, -0.19110107421875, -0.087249755859375, 0.0166015625, 0.120452880859375, 0.22430419921875, 0.328155517578125, 0.4320068359375, 0.535858154296875, 0.63970947265625, 0.743560791015625, 0.847412109375, 0.951263427734375, 1.05511474609375, 1.158966064453125, 1.2628173828125, 1.366668701171875, 1.47052001953125, 1.574371337890625, 1.67822265625, 1.782073974609375, 1.88592529296875, 1.989776611328125, 2.0936279296875, 2.197479248046875, 2.30133056640625, 2.405181884765625, 2.509033203125, 2.612884521484375, 2.71673583984375, 2.820587158203125, 2.9244384765625, 3.028289794921875, 3.13214111328125, 3.235992431640625, 3.33984375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 14.0, 16.0, 25.0, 46.0, 45.0, 75.0, 115.0, 160.0, 307.0, 563.0, 1040.0, 1887.0, 3866.0, 8725.0, 19783.0, 46749.0, 110651.0, 166268.0, 94086.0, 38846.0, 16379.0, 7298.0, 3349.0, 1620.0, 880.0, 569.0, 333.0, 175.0, 131.0, 63.0, 60.0, 34.0, 35.0, 25.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.859375, -22.15380859375, -21.4482421875, -20.74267578125, -20.037109375, -19.33154296875, -18.6259765625, -17.92041015625, -17.21484375, -16.50927734375, -15.8037109375, -15.09814453125, -14.392578125, -13.68701171875, -12.9814453125, -12.27587890625, -11.5703125, -10.86474609375, -10.1591796875, -9.45361328125, -8.748046875, -8.04248046875, -7.3369140625, -6.63134765625, -5.92578125, -5.22021484375, -4.5146484375, -3.80908203125, -3.103515625, -2.39794921875, -1.6923828125, -0.98681640625, -0.28125, 0.42431640625, 1.1298828125, 1.83544921875, 2.541015625, 3.24658203125, 3.9521484375, 4.65771484375, 5.36328125, 6.06884765625, 6.7744140625, 7.47998046875, 8.185546875, 8.89111328125, 9.5966796875, 10.30224609375, 11.0078125, 11.71337890625, 12.4189453125, 13.12451171875, 13.830078125, 14.53564453125, 15.2412109375, 15.94677734375, 16.65234375, 17.35791015625, 18.0634765625, 18.76904296875, 19.474609375, 20.18017578125, 20.8857421875, 21.59130859375, 22.296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 1.0, 9.0, 10.0, 11.0, 16.0, 14.0, 23.0, 22.0, 36.0, 49.0, 43.0, 64.0, 81.0, 76.0, 88.0, 82.0, 71.0, 54.0, 55.0, 36.0, 32.0, 24.0, 16.0, 19.0, 18.0, 11.0, 11.0, 4.0, 7.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.23785400390625, -5.0772705078125, -4.91668701171875, -4.756103515625, -4.59552001953125, -4.4349365234375, -4.27435302734375, -4.11376953125, -3.95318603515625, -3.7926025390625, -3.63201904296875, -3.471435546875, -3.31085205078125, -3.1502685546875, -2.98968505859375, -2.8291015625, -2.66851806640625, -2.5079345703125, -2.34735107421875, -2.186767578125, -2.02618408203125, -1.8656005859375, -1.70501708984375, -1.54443359375, -1.38385009765625, -1.2232666015625, -1.06268310546875, -0.902099609375, -0.74151611328125, -0.5809326171875, -0.42034912109375, -0.259765625, -0.09918212890625, 0.0614013671875, 0.22198486328125, 0.382568359375, 0.54315185546875, 0.7037353515625, 0.86431884765625, 1.02490234375, 1.18548583984375, 1.3460693359375, 1.50665283203125, 1.667236328125, 1.82781982421875, 1.9884033203125, 2.14898681640625, 2.3095703125, 2.47015380859375, 2.6307373046875, 2.79132080078125, 2.951904296875, 3.11248779296875, 3.2730712890625, 3.43365478515625, 3.59423828125, 3.75482177734375, 3.9154052734375, 4.07598876953125, 4.236572265625, 4.39715576171875, 4.5577392578125, 4.71832275390625, 4.87890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 9.0, 6.0, 8.0, 16.0, 21.0, 34.0, 85.0, 134.0, 91.0, 57.0, 9.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.79833984375, -68.21504974365234, -66.63175964355469, -65.04846954345703, -63.46518325805664, -61.881893157958984, -60.298606872558594, -58.71531677246094, -57.13202667236328, -55.548736572265625, -53.96544647216797, -52.38216018676758, -50.79887008666992, -49.215579986572266, -47.632293701171875, -46.04900360107422, -44.46571350097656, -42.882423400878906, -41.29913330078125, -39.71584701538086, -38.1325569152832, -36.54926681518555, -34.965980529785156, -33.3826904296875, -31.799400329589844, -30.216110229492188, -28.632822036743164, -27.04953384399414, -25.466243743896484, -23.882953643798828, -22.299665451049805, -20.71637725830078, -19.13309097290039, -17.549800872802734, -15.966512680053711, -14.383223533630371, -12.799934387207031, -11.216645240783691, -9.633356094360352, -8.050066947937012, -6.466777801513672, -4.883488655090332, -3.300199508666992, -1.7169103622436523, -0.1336212158203125, 1.4496679306030273, 3.032957077026367, 4.616246223449707, 6.199535369873047, 7.782824516296387, 9.366113662719727, 10.949402809143066, 12.532691955566406, 14.115981101989746, 15.699270248413086, 17.28255844116211, 18.865848541259766, 20.449138641357422, 22.032426834106445, 23.61571502685547, 25.199005126953125, 26.78229522705078, 28.365583419799805, 29.948871612548828, 31.532161712646484]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 8.0, 13.0, 21.0, 46.0, 89.0, 97.0, 67.0, 48.0, 19.0, 12.0, 7.0, 9.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.716785430908203, -23.91179847717285, -23.106813430786133, -22.30182647705078, -21.496841430664062, -20.69185447692871, -19.88686752319336, -19.08188247680664, -18.27689552307129, -17.471908569335938, -16.66692352294922, -15.861936569213867, -15.056950569152832, -14.251964569091797, -13.446977615356445, -12.64199161529541, -11.837005615234375, -11.03201961517334, -10.227033615112305, -9.422046661376953, -8.617060661315918, -7.812074661254883, -7.0070881843566895, -6.202101707458496, -5.397115707397461, -4.592129707336426, -3.7871432304382324, -2.982156991958618, -2.177170753479004, -1.3721847534179688, -0.5671982765197754, 0.23778820037841797, 1.0427722930908203, 1.8477585315704346, 2.652744770050049, 3.457731008529663, 4.262717247009277, 5.0677032470703125, 5.872689723968506, 6.677676200866699, 7.482662200927734, 8.28764820098877, 9.092634201049805, 9.897621154785156, 10.702607154846191, 11.507593154907227, 12.312580108642578, 13.117566108703613, 13.922552108764648, 14.727538108825684, 15.532524108886719, 16.33751106262207, 17.142498016357422, 17.94748306274414, 18.752470016479492, 19.557456970214844, 20.362442016601562, 21.167428970336914, 21.972414016723633, 22.777400970458984, 23.582386016845703, 24.387372970581055, 25.192359924316406, 25.997344970703125, 26.802331924438477]}, "eval/loss": 0.7367066740989685, "eval/wer": 0.1332606108687029, "eval/runtime": 818.2808, "eval/samples_per_second": 3.229, "eval/steps_per_second": 0.405} \ No newline at end of file